diff --git a/.github/actions/common_setup/action.yml b/.github/actions/common_setup/action.yml index b02413adc44..e492fa97816 100644 --- a/.github/actions/common_setup/action.yml +++ b/.github/actions/common_setup/action.yml @@ -18,9 +18,6 @@ runs: echo "Setup the common ENV variables" cat >> "$GITHUB_ENV" << 'EOF' TEMP_PATH=${{runner.temp}}/${{inputs.job_type}} - REPO_COPY=${{runner.temp}}/${{inputs.job_type}}/git-repo-copy - IMAGES_PATH=${{runner.temp}}/images_path - REPORTS_PATH=${{runner.temp}}/reports_dir EOF if [ -z "${{env.GITHUB_JOB_OVERRIDDEN}}" ] && [ "true" == "${{inputs.nested_job}}" ]; then echo "The GITHUB_JOB_OVERRIDDEN ENV is unset, and must be set for the nested jobs" @@ -30,6 +27,4 @@ runs: shell: bash run: | # to remove every leftovers - sudo rm -fr "$TEMP_PATH" - mkdir -p "$REPO_COPY" - cp -a "$GITHUB_WORKSPACE"/. "$REPO_COPY"/ + sudo rm -fr "$TEMP_PATH" && mkdir -p "$TEMP_PATH" diff --git a/.github/workflows/backport_branches.yml b/.github/workflows/backport_branches.yml index f6af4778cf1..ef554a1b0ff 100644 --- a/.github/workflows/backport_branches.yml +++ b/.github/workflows/backport_branches.yml @@ -10,27 +10,21 @@ on: # yamllint disable-line rule:truthy branches: - 'backport/**' jobs: - CheckLabels: + RunConfig: runs-on: [self-hosted, style-checker] - # Run the first check always, even if the CI is cancelled - if: ${{ always() }} + outputs: + data: ${{ steps.runconfig.outputs.CI_DATA }} steps: - name: Check out repository code uses: ClickHouse/checkout@v1 with: - clear-repository: true + clear-repository: true # to ensure correct digests + fetch-depth: 0 # to get version + filter: tree:0 - name: Labels check run: | cd "$GITHUB_WORKSPACE/tests/ci" python3 run_check.py - PythonUnitTests: - runs-on: [self-hosted, style-checker] - needs: CheckLabels - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - name: Python unit tests run: | cd "$GITHUB_WORKSPACE/tests/ci" @@ -40,273 +34,237 @@ jobs: echo "Testing $dir" python3 -m unittest discover -s "$dir" -p 'test_*.py' done - DockerHubPushAarch64: - runs-on: [self-hosted, style-checker-aarch64] - needs: CheckLabels - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - - name: Images check + - name: PrepareRunConfig + id: runconfig run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_images_check.py --suffix aarch64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images_aarch64 - path: ${{ runner.temp }}/docker_images_check/changed_images_aarch64.json - DockerHubPushAmd64: - runs-on: [self-hosted, style-checker] - needs: CheckLabels - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - - name: Images check + echo "::group::configure CI run" + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --configure --outfile ${{ runner.temp }}/ci_run_data.json + echo "::endgroup::" + + echo "::group::CI run configure results" + python3 -m json.tool ${{ runner.temp }}/ci_run_data.json + echo "::endgroup::" + + { + echo 'CI_DATA<> "$GITHUB_OUTPUT" + - name: Re-create GH statuses for skipped jobs if any run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_images_check.py --suffix amd64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp }}/docker_images_check/changed_images_amd64.json - DockerHubPush: - needs: [DockerHubPushAmd64, 
DockerHubPushAarch64, PythonUnitTests] - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # to find ancestor merge commits necessary for finding proper docker tags - filter: tree:0 - - name: Download changed aarch64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_aarch64 - path: ${{ runner.temp }} - - name: Download changed amd64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp }} - - name: Images check - run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_manifests_merge.py --suffix amd64 --suffix aarch64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images - path: ${{ runner.temp }}/changed_images.json + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ runner.temp }}/ci_run_data.json --update-gh-statuses + BuildDockers: + needs: [RunConfig] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_docker.yml + with: + data: ${{ needs.RunConfig.outputs.data }} CompatibilityCheckX86: - needs: [BuilderDebRelease] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (amd64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (amd64)" --check-glibc --check-distributions CompatibilityCheckAarch64: - needs: [BuilderDebAarch64] + needs: [RunConfig, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (aarch64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (aarch64)" --check-glibc ######################################################################################### #################################### ORDINARY BUILDS #################################### ######################################################################################### BuilderDebRelease: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_release checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_aarch64 checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_asan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebTsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_tsan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebDebug: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: 
package_debug + data: ${{ needs.RunConfig.outputs.data }} BuilderBinDarwin: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_darwin + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinDarwinAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_darwin_aarch64 + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 ############################################################################################ ##################################### Docker images ####################################### ############################################################################################ DockerServerImages: - needs: - - BuilderDebRelease - - BuilderDebAarch64 - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # It MUST BE THE SAME for all dependencies and the job itself - filter: tree:0 - - name: Check docker clickhouse/clickhouse-server building - run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_server.py --release-type head --no-push \ - --image-repo clickhouse/clickhouse-server --image-path docker/server - python3 docker_server.py --release-type head --no-push \ - --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper - - name: Cleanup - if: always() - run: | - docker ps --quiet | xargs --no-run-if-empty docker kill ||: - docker ps --all --quiet | xargs --no-run-if-empty docker rm -f ||: - sudo rm -fr "$TEMP_PATH" + needs: [RunConfig, BuilderDebRelease, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Docker server and keeper images + runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} + checkout_depth: 0 # It MUST BE THE SAME for all dependencies and the job itself + run_command: | + cd "$GITHUB_WORKSPACE/tests/ci" + python3 docker_server.py --release-type head --no-push \ + --image-repo clickhouse/clickhouse-server --image-path docker/server --allow-build-reuse + python3 docker_server.py --release-type head --no-push \ + --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper --allow-build-reuse ############################################################################################ ##################################### BUILD REPORTER ####################################### ############################################################################################ BuilderReport: - if: ${{ success() || failure() }} + # run report check for failed builds to indicate the CI error + if: ${{ !cancelled() }} needs: - - BuilderDebRelease + - RunConfig - BuilderDebAarch64 - BuilderDebAsan - - BuilderDebTsan - BuilderDebDebug + - BuilderDebRelease + - BuilderDebTsan uses: ./.github/workflows/reusable_test.yml with: test_name: ClickHouse build check runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} additional_envs: | NEEDS_DATA<> "$GITHUB_OUTPUT" + - name: Re-create GH statuses for skipped jobs if any run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_images_check.py --suffix amd64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp 
}}/docker_images_check/changed_images_amd64.json - DockerHubPush: - needs: [DockerHubPushAmd64, DockerHubPushAarch64, PythonUnitTests] - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # to find ancestor merge commits necessary for finding proper docker tags - filter: tree:0 - - name: Download changed aarch64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_aarch64 - path: ${{ runner.temp }} - - name: Download changed amd64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp }} - - name: Images check - run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_manifests_merge.py --suffix amd64 --suffix aarch64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images - path: ${{ runner.temp }}/changed_images.json + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ runner.temp }}/ci_run_data.json --update-gh-statuses + BuildDockers: + needs: [RunConfig] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_docker.yml + with: + data: ${{ needs.RunConfig.outputs.data }} + set_latest: true StyleCheck: - needs: DockerHubPush - if: ${{ success() || failure() }} + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: test_name: Style check runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 style_check.py --no-push CompatibilityCheckX86: - needs: [BuilderDebRelease] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (amd64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (amd64)" --check-glibc --check-distributions CompatibilityCheckAarch64: - needs: [BuilderDebAarch64] + needs: [RunConfig, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (aarch64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (aarch64)" --check-glibc ######################################################################################### #################################### ORDINARY BUILDS #################################### ######################################################################################### +# TODO: never skip builds! 
BuilderDebRelease: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: - checkout_depth: 0 build_name: package_release + checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: - checkout_depth: 0 build_name: package_aarch64 + checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderBinRelease: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: - checkout_depth: 0 build_name: binary_release + checkout_depth: 0 # otherwise we will have no info about contributors + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_asan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebUBsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_ubsan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebTsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_tsan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebMsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_msan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebDebug: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_debug + data: ${{ needs.RunConfig.outputs.data }} ########################################################################################## ##################################### SPECIAL BUILDS ##################################### ########################################################################################## BuilderBinClangTidy: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_tidy + data: ${{ needs.RunConfig.outputs.data }} BuilderBinDarwin: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_darwin + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_aarch64 + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinFreeBSD: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_freebsd + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinDarwinAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: 
./.github/workflows/reusable_build.yml with: build_name: binary_darwin_aarch64 + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinPPC64: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_ppc64le + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinAmd64Compat: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_amd64_compat + data: ${{ needs.RunConfig.outputs.data }} + checkout_depth: 0 + BuilderBinAmd64Musl: + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_build.yml + with: + build_name: binary_amd64_musl + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinAarch64V80Compat: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_aarch64_v80compat + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinRISCV64: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_riscv64 + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 BuilderBinS390X: - needs: [DockerHubPush] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_s390x + data: ${{ needs.RunConfig.outputs.data }} checkout_depth: 0 ############################################################################################ ##################################### Docker images ####################################### ############################################################################################ DockerServerImages: - needs: - - BuilderDebRelease - - BuilderDebAarch64 - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # It MUST BE THE SAME for all dependencies and the job itself - filter: tree:0 - - name: Check docker clickhouse/clickhouse-server building - run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_server.py --release-type head \ - --image-repo clickhouse/clickhouse-server --image-path docker/server - python3 docker_server.py --release-type head \ - --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper - - name: Cleanup - if: always() - run: | - docker ps --quiet | xargs --no-run-if-empty docker kill ||: - docker ps --all --quiet | xargs --no-run-if-empty docker rm -f ||: - sudo rm -fr "$TEMP_PATH" + needs: [RunConfig, BuilderDebRelease, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Docker server and keeper images + runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} + # FIXME: avoid using 0 checkout + checkout_depth: 0 # It MUST BE THE SAME for all dependencies and the job itself + run_command: | + cd "$GITHUB_WORKSPACE/tests/ci" + python3 docker_server.py --release-type head \ + --image-repo clickhouse/clickhouse-server --image-path docker/server + python3 docker_server.py --release-type head \ + --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper 
############################################################################################ ##################################### BUILD REPORTER ####################################### ############################################################################################ BuilderReport: - if: ${{ success() || failure() }} + # run report check for failed builds to indicate the CI error + if: ${{ !cancelled() }} needs: + - RunConfig - BuilderBinRelease - BuilderDebAarch64 - BuilderDebAsan @@ -269,16 +278,18 @@ jobs: with: test_name: ClickHouse build check runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} additional_envs: | NEEDS_DATA<> "$GITHUB_OUTPUT" + BuildDockers: + needs: [RunConfig] + uses: ./.github/workflows/reusable_docker.yml + with: + data: "${{ needs.RunConfig.outputs.data }}" + set_latest: true SonarCloud: runs-on: [self-hosted, builder] env: diff --git a/.github/workflows/pull_request.yml b/.github/workflows/pull_request.yml index c92fa52ed4e..bd2b2b60904 100644 --- a/.github/workflows/pull_request.yml +++ b/.github/workflows/pull_request.yml @@ -13,37 +13,25 @@ on: # yamllint disable-line rule:truthy - opened branches: - master - paths-ignore: - - '**.md' - - 'docker/docs/**' - - 'docs/**' - - 'utils/check-style/aspell-ignore/**' - - 'tests/ci/docs_check.py' - - '.github/workflows/docs_check.yml' ########################################################################################## ##################################### SMALL CHECKS ####################################### ########################################################################################## jobs: - CheckLabels: + RunConfig: runs-on: [self-hosted, style-checker] - # Run the first check always, even if the CI is cancelled - if: ${{ always() }} + outputs: + data: ${{ steps.runconfig.outputs.CI_DATA }} steps: - name: Check out repository code uses: ClickHouse/checkout@v1 with: - clear-repository: true + clear-repository: true # to ensure correct digests + fetch-depth: 0 # to get version + filter: tree:0 - name: Labels check run: | cd "$GITHUB_WORKSPACE/tests/ci" python3 run_check.py - PythonUnitTests: - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - name: Python unit tests run: | cd "$GITHUB_WORKSPACE/tests/ci" @@ -53,244 +41,260 @@ jobs: echo "Testing $dir" python3 -m unittest discover -s "$dir" -p 'test_*.py' done - DockerHubPushAarch64: - needs: CheckLabels - runs-on: [self-hosted, style-checker-aarch64] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - - name: Images check + - name: PrepareRunConfig + id: runconfig run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_images_check.py --suffix aarch64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images_aarch64 - path: ${{ runner.temp }}/docker_images_check/changed_images_aarch64.json - DockerHubPushAmd64: - needs: CheckLabels - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - - name: Images check + echo "::group::configure CI run" + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --configure --outfile ${{ runner.temp }}/ci_run_data.json + echo "::endgroup::" + + echo "::group::CI run configure results" + python3 -m json.tool ${{ runner.temp }}/ci_run_data.json + echo "::endgroup::" + + { + echo 'CI_DATA<> 
"$GITHUB_OUTPUT" + - name: Re-create GH statuses for skipped jobs if any run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_images_check.py --suffix amd64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp }}/docker_images_check/changed_images_amd64.json - DockerHubPush: - needs: [DockerHubPushAmd64, DockerHubPushAarch64, PythonUnitTests] - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # to find ancestor merge commits necessary for finding proper docker tags - filter: tree:0 - - name: Download changed aarch64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_aarch64 - path: ${{ runner.temp }} - - name: Download changed amd64 images - uses: actions/download-artifact@v3 - with: - name: changed_images_amd64 - path: ${{ runner.temp }} - - name: Images check + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ runner.temp }}/ci_run_data.json --update-gh-statuses + - name: Style check early + # hack to run style check before the docker build job if possible (style-check image not changed) + if: contains(fromJson(steps.runconfig.outputs.CI_DATA).jobs_data.jobs_to_do, 'Style check early') run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_manifests_merge.py --suffix amd64 --suffix aarch64 - - name: Upload images files to artifacts - uses: actions/upload-artifact@v3 - with: - name: changed_images - path: ${{ runner.temp }}/changed_images.json + DOCKER_TAG=$(echo '${{ toJson(fromJson(steps.runconfig.outputs.CI_DATA).docker_data.images) }}' | tr -d '\n') + export DOCKER_TAG=$DOCKER_TAG + python3 ./tests/ci/style_check.py --no-push + BuildDockers: + needs: [RunConfig] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_docker.yml + with: + data: ${{ needs.RunConfig.outputs.data }} StyleCheck: - needs: DockerHubPush - # We need additional `&& ! cancelled()` to have the job being able to cancel - if: ${{ success() || failure() || ( always() && ! 
cancelled() ) }} + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: test_name: Style check runner_type: style-checker run_command: | - cd "$REPO_COPY/tests/ci" python3 style_check.py + data: ${{ needs.RunConfig.outputs.data }} secrets: secret_envs: | ROBOT_CLICKHOUSE_SSH_KEY<> "$GITHUB_OUTPUT" + - name: Re-create GH statuses for skipped jobs if any + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ runner.temp }}/ci_run_data.json --update-gh-statuses + BuildDockers: + needs: [RunConfig] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_docker.yml + with: + data: ${{ needs.RunConfig.outputs.data }} CompatibilityCheckX86: - needs: [BuilderDebRelease] + needs: [RunConfig, BuilderDebRelease] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (amd64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (amd64)" --check-glibc --check-distributions CompatibilityCheckAarch64: - needs: [BuilderDebAarch64] + needs: [RunConfig, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_test.yml with: - test_name: Compatibility check X86 + test_name: Compatibility check (aarch64) runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} run_command: | - cd "$REPO_COPY/tests/ci" python3 compatibility_check.py --check-name "Compatibility check (aarch64)" --check-glibc ######################################################################################### #################################### ORDINARY BUILDS #################################### ######################################################################################### BuilderDebRelease: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_release checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_aarch64 checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderDebAsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_asan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebUBsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_ubsan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebTsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_tsan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebMsan: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: package_msan + data: ${{ needs.RunConfig.outputs.data }} BuilderDebDebug: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: 
./.github/workflows/reusable_build.yml with: build_name: package_debug + data: ${{ needs.RunConfig.outputs.data }} BuilderBinDarwin: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_darwin checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} BuilderBinDarwinAarch64: - needs: [DockerHubPush] + needs: [RunConfig, BuildDockers] + if: ${{ !failure() && !cancelled() }} uses: ./.github/workflows/reusable_build.yml with: build_name: binary_darwin_aarch64 checkout_depth: 0 + data: ${{ needs.RunConfig.outputs.data }} ############################################################################################ ##################################### Docker images ####################################### ############################################################################################ DockerServerImages: - needs: - - BuilderDebRelease - - BuilderDebAarch64 - runs-on: [self-hosted, style-checker] - steps: - - name: Check out repository code - uses: ClickHouse/checkout@v1 - with: - clear-repository: true - fetch-depth: 0 # It MUST BE THE SAME for all dependencies and the job itself - filter: tree:0 - - name: Check docker clickhouse/clickhouse-server building - run: | - cd "$GITHUB_WORKSPACE/tests/ci" - python3 docker_server.py --release-type head --no-push \ - --image-repo clickhouse/clickhouse-server --image-path docker/server - python3 docker_server.py --release-type head --no-push \ - --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper - - name: Cleanup - if: always() - run: | - docker ps --quiet | xargs --no-run-if-empty docker kill ||: - docker ps --all --quiet | xargs --no-run-if-empty docker rm -f ||: - sudo rm -fr "$TEMP_PATH" + needs: [RunConfig, BuilderDebRelease, BuilderDebAarch64] + if: ${{ !failure() && !cancelled() }} + uses: ./.github/workflows/reusable_test.yml + with: + test_name: Docker server and keeper images + runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} + checkout_depth: 0 + run_command: | + cd "$GITHUB_WORKSPACE/tests/ci" + python3 docker_server.py --release-type head --no-push \ + --image-repo clickhouse/clickhouse-server --image-path docker/server --allow-build-reuse + python3 docker_server.py --release-type head --no-push \ + --image-repo clickhouse/clickhouse-keeper --image-path docker/keeper --allow-build-reuse ############################################################################################ ##################################### BUILD REPORTER ####################################### ############################################################################################ BuilderReport: - if: ${{ success() || failure() }} + # run report check for failed builds to indicate the CI error + if: ${{ !cancelled() }} needs: + - RunConfig - BuilderDebRelease - BuilderDebAarch64 - BuilderDebAsan @@ -189,30 +187,38 @@ jobs: with: test_name: ClickHouse build check runner_type: style-checker + data: ${{ needs.RunConfig.outputs.data }} additional_envs: | NEEDS_DATA<> "$GITHUB_ENV" << 'EOF' ${{inputs.additional_envs}} + DOCKER_TAG<> "$GITHUB_ENV" - name: Apply sparse checkout for contrib # in order to check that it doesn't break build @@ -60,20 +69,20 @@ jobs: uses: ./.github/actions/common_setup with: job_type: build_check - - name: Download changed images - uses: actions/download-artifact@v3 - with: - name: changed_images - path: ${{ env.IMAGES_PATH }} + - name: Pre + run: | + python3 
"$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --pre --job-name '${{inputs.build_name}}' - name: Build run: | - cd "$REPO_COPY/tests/ci" && python3 build_check.py "$BUILD_NAME" - - name: Upload build URLs to artifacts - if: ${{ success() || failure() }} - uses: actions/upload-artifact@v3 - with: - name: ${{ env.BUILD_URLS }} - path: ${{ env.TEMP_PATH }}/${{ env.BUILD_URLS }}.json + python3 "$GITHUB_WORKSPACE/tests/ci/build_check.py" "$BUILD_NAME" + - name: Post + # it still be build report to upload for failed build job + if: always() + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --post --job-name '${{inputs.build_name}}' + - name: Mark as done + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --mark-success --job-name '${{inputs.build_name}}' - name: Clean if: always() uses: ./.github/actions/clean diff --git a/.github/workflows/reusable_docker.yml b/.github/workflows/reusable_docker.yml new file mode 100644 index 00000000000..08a5740e7e0 --- /dev/null +++ b/.github/workflows/reusable_docker.yml @@ -0,0 +1,68 @@ +name: Build docker images +'on': + workflow_call: + inputs: + data: + description: json with ci data from todo job + required: true + type: string + set_latest: + description: set latest tag for resulting multiarch manifest + required: false + type: boolean + default: false +jobs: + DockerBuildAarch64: + runs-on: [self-hosted, style-checker-aarch64] + if: | + !failure() && !cancelled() && toJson(fromJson(inputs.data).docker_data.missing_aarch64) != '[]' + steps: + - name: Check out repository code + uses: ClickHouse/checkout@v1 + with: + ref: ${{ fromJson(inputs.data).git_ref }} + - name: Build images + run: | + python3 "${GITHUB_WORKSPACE}/tests/ci/docker_images_check.py" \ + --suffix aarch64 \ + --image-tags '${{ toJson(fromJson(inputs.data).docker_data.images) }}' \ + --missing-images '${{ toJson(fromJson(inputs.data).docker_data.missing_aarch64) }}' + DockerBuildAmd64: + runs-on: [self-hosted, style-checker] + if: | + !failure() && !cancelled() && toJson(fromJson(inputs.data).docker_data.missing_amd64) != '[]' + steps: + - name: Check out repository code + uses: ClickHouse/checkout@v1 + with: + ref: ${{ fromJson(inputs.data).git_ref }} + - name: Build images + run: | + python3 "${GITHUB_WORKSPACE}/tests/ci/docker_images_check.py" \ + --suffix amd64 \ + --image-tags '${{ toJson(fromJson(inputs.data).docker_data.images) }}' \ + --missing-images '${{ toJson(fromJson(inputs.data).docker_data.missing_amd64) }}' + DockerMultiArchManifest: + needs: [DockerBuildAmd64, DockerBuildAarch64] + runs-on: [self-hosted, style-checker] + if: | + !failure() && !cancelled() && toJson(fromJson(inputs.data).docker_data.missing_multi) != '[]' + steps: + - name: Check out repository code + uses: ClickHouse/checkout@v1 + with: + ref: ${{ fromJson(inputs.data).git_ref }} + - name: Build images + run: | + cd "$GITHUB_WORKSPACE/tests/ci" + if [ "${{ inputs.set_latest }}" == "true" ]; then + echo "latest tag will be set for resulting manifests" + python3 docker_manifests_merge.py --suffix amd64 --suffix aarch64 \ + --image-tags '${{ toJson(fromJson(inputs.data).docker_data.images) }}' \ + --missing-images '${{ toJson(fromJson(inputs.data).docker_data.missing_multi) }}' \ + --set-latest + else + python3 docker_manifests_merge.py --suffix amd64 --suffix aarch64 \ + --image-tags '${{ toJson(fromJson(inputs.data).docker_data.images) }}' \ + --missing-images '${{ 
toJson(fromJson(inputs.data).docker_data.missing_multi) }}' + fi diff --git a/.github/workflows/reusable_simple_job.yml b/.github/workflows/reusable_simple_job.yml new file mode 100644 index 00000000000..ea196a32664 --- /dev/null +++ b/.github/workflows/reusable_simple_job.yml @@ -0,0 +1,90 @@ +### For the pure soul wishes to move it to another place +# https://github.com/orgs/community/discussions/9050 + +name: Simple job +'on': + workflow_call: + inputs: + test_name: + description: the value of test type from tests/ci/ci_config.py, ends up as $CHECK_NAME ENV + required: true + type: string + runner_type: + description: the label of runner to use + required: true + type: string + run_command: + description: the command to launch the check + default: "" + required: false + type: string + checkout_depth: + description: the value of the git shallow checkout + required: false + type: number + default: 1 + submodules: + description: if the submodules should be checked out + required: false + type: boolean + default: false + additional_envs: + description: additional ENV variables to setup the job + type: string + working-directory: + description: sets custom working directory + type: string + default: "" + git_ref: + description: commit to use, merge commit for pr or head + required: false + type: string + default: ${{ github.event.after }} # no merge commit + secrets: + secret_envs: + description: if given, it's passed to the environments + required: false + + +env: + # Force the stdout and stderr streams to be unbuffered + PYTHONUNBUFFERED: 1 + CHECK_NAME: ${{inputs.test_name}} + +jobs: + Test: + runs-on: [self-hosted, '${{inputs.runner_type}}'] + name: ${{inputs.test_name}} + env: + GITHUB_JOB_OVERRIDDEN: ${{inputs.test_name}} + steps: + - name: Check out repository code + uses: ClickHouse/checkout@v1 + with: + clear-repository: true + ref: ${{ inputs.git_ref }} + submodules: ${{inputs.submodules}} + fetch-depth: ${{inputs.checkout_depth}} + filter: tree:0 + - name: Set build envs + run: | + cat >> "$GITHUB_ENV" << 'EOF' + CHECK_NAME=${{ inputs.test_name }} + ${{inputs.additional_envs}} + ${{secrets.secret_envs}} + EOF + - name: Common setup + uses: ./.github/actions/common_setup + with: + job_type: test + - name: Run + run: | + if [ -n '${{ inputs.working-directory }}' ]; then + cd "${{ inputs.working-directory }}" + else + cd "$GITHUB_WORKSPACE/tests/ci" + fi + ${{ inputs.run_command }} + - name: Clean + if: always() + uses: ./.github/actions/clean diff --git a/.github/workflows/reusable_test.yml b/.github/workflows/reusable_test.yml index e82d2d51596..09177ad887a 100644 --- a/.github/workflows/reusable_test.yml +++ b/.github/workflows/reusable_test.yml @@ -14,13 +14,10 @@ name: Testing workflow required: true type: string run_command: - description: the command to launch the check. 
Usually starts with `cd '$REPO_COPY/tests/ci'` - required: true + description: the command to launch the check + default: "" + required: false type: string - batches: - description: how many batches for the test will be launched - default: 1 - type: number checkout_depth: description: the value of the git shallow checkout required: false @@ -34,80 +31,89 @@ name: Testing workflow additional_envs: description: additional ENV variables to setup the job type: string + data: + description: ci data + type: string + required: true + working-directory: + description: sets custom working directory + type: string + default: "" secrets: secret_envs: description: if given, it's passed to the environments required: false + env: # Force the stdout and stderr streams to be unbuffered PYTHONUNBUFFERED: 1 CHECK_NAME: ${{inputs.test_name}} jobs: - PrepareStrategy: - # batches < 1 is misconfiguration, - # and we need this step only for batches > 1 - if: ${{ inputs.batches > 1 }} - runs-on: [self-hosted, style-checker-aarch64] - outputs: - batches: ${{steps.batches.outputs.batches}} - steps: - - name: Calculate batches - id: batches - run: | - batches_output=$(python3 -c 'import json; print(json.dumps(list(range(${{inputs.batches}}))))') - echo "batches=${batches_output}" >> "$GITHUB_OUTPUT" Test: - # If PrepareStrategy is skipped for batches == 1, - # we still need to launch the test. - # `! failure()` is mandatory here to launch on skipped Job - # `&& !cancelled()` to allow the be cancelable - if: ${{ ( !failure() && !cancelled() ) && inputs.batches > 0 }} - # Do not add `-0` to the end, if there's only one batch - name: ${{inputs.test_name}}${{ inputs.batches > 1 && format('-{0}',matrix.batch) || '' }} - env: - GITHUB_JOB_OVERRIDDEN: ${{inputs.test_name}}${{ inputs.batches > 1 && format('-{0}',matrix.batch) || '' }} runs-on: [self-hosted, '${{inputs.runner_type}}'] - needs: [PrepareStrategy] + if: ${{ !failure() && !cancelled() && contains(fromJson(inputs.data).jobs_data.jobs_to_do, inputs.test_name) }} + name: ${{inputs.test_name}}${{ fromJson(inputs.data).jobs_data.jobs_params[inputs.test_name].num_batches > 1 && format('-{0}',matrix.batch) || '' }} + env: + GITHUB_JOB_OVERRIDDEN: ${{inputs.test_name}}${{ fromJson(inputs.data).jobs_data.jobs_params[inputs.test_name].num_batches > 1 && format('-{0}',matrix.batch) || '' }} strategy: fail-fast: false # we always wait for entire matrix matrix: - # if PrepareStrategy does not have batches, we use 0 - batch: ${{ needs.PrepareStrategy.outputs.batches - && fromJson(needs.PrepareStrategy.outputs.batches) - || fromJson('[0]')}} + batch: ${{ fromJson(inputs.data).jobs_data.jobs_params[inputs.test_name].batches }} steps: - name: Check out repository code uses: ClickHouse/checkout@v1 with: clear-repository: true + ref: ${{ fromJson(inputs.data).git_ref }} submodules: ${{inputs.submodules}} fetch-depth: ${{inputs.checkout_depth}} filter: tree:0 - name: Set build envs run: | cat >> "$GITHUB_ENV" << 'EOF' + CHECK_NAME=${{ inputs.test_name }} ${{inputs.additional_envs}} ${{secrets.secret_envs}} + DOCKER_TAG< 1}} + if: ${{ fromJson(inputs.data).jobs_data.jobs_params[inputs.test_name].num_batches > 1 }} run: | cat >> "$GITHUB_ENV" << 'EOF' RUN_BY_HASH_NUM=${{matrix.batch}} - RUN_BY_HASH_TOTAL=${{inputs.batches}} + RUN_BY_HASH_TOTAL=${{ fromJson(inputs.data).jobs_data.jobs_params[inputs.test_name].num_batches }} EOF - - name: Run test - run: ${{inputs.run_command}} + - name: Pre run + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} 
--pre --job-name '${{inputs.test_name}}' + - name: Run + run: | + if [ -n "${{ inputs.working-directory }}" ]; then + cd "${{ inputs.working-directory }}" + else + cd "$GITHUB_WORKSPACE/tests/ci" + fi + if [ -n "$(echo '${{ inputs.run_command }}' | tr -d '\n')" ]; then + echo "Running command from workflow input" + ${{ inputs.run_command }} + else + echo "Running command from job config" + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --run --job-name '${{inputs.test_name}}' + fi + - name: Post run + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --post --job-name '${{inputs.test_name}}' + - name: Mark as done + run: | + python3 "$GITHUB_WORKSPACE/tests/ci/ci.py" --infile ${{ toJson(inputs.data) }} --mark-success --job-name '${{inputs.test_name}}' --batch ${{matrix.batch}} - name: Clean if: always() uses: ./.github/actions/clean diff --git a/.gitmessage b/.gitmessage new file mode 100644 index 00000000000..f4a25a837bc --- /dev/null +++ b/.gitmessage @@ -0,0 +1,10 @@ + + +## To avoid merge commit in CI run (add a leading space to apply): +#no-merge-commit + +## Running specified job (add a leading space to apply): +#job_ +#job_stateless_tests_release +#job_package_debug +#job_integration_tests_asan diff --git a/CHANGELOG.md b/CHANGELOG.md index aa40012617c..283000f1804 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,4 +1,6 @@ ### Table of Contents +**[ClickHouse release v23.12, 2023-12-28](#2312)**
+**[ClickHouse release v23.11, 2023-12-06](#2311)**
**[ClickHouse release v23.10, 2023-11-02](#2310)**
**[ClickHouse release v23.9, 2023-09-28](#239)**
**[ClickHouse release v23.8 LTS, 2023-08-31](#238)**
@@ -13,7 +15,357 @@ # 2023 Changelog -### ClickHouse release 23.10, 2023-11-02 +### ClickHouse release 23.12, 2023-12-28 + +#### Backward Incompatible Change +* Fix check for non-deterministic functions in TTL expressions. Previously, you could create a TTL expression with non-deterministic functions in some cases, which could lead to undefined behavior later. This fixes [#37250](https://github.com/ClickHouse/ClickHouse/issues/37250). Disallow TTL expressions that don't depend on any columns of a table by default. It can be allowed back by `SET allow_suspicious_ttl_expressions = 1` or `SET compatibility = '23.11'`. Closes [#37286](https://github.com/ClickHouse/ClickHouse/issues/37286). [#51858](https://github.com/ClickHouse/ClickHouse/pull/51858) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* The MergeTree setting `clean_deleted_rows` is deprecated, it has no effect anymore. The `CLEANUP` keyword for the `OPTIMIZE` is not allowed by default (it can be unlocked with the `allow_experimental_replacing_merge_with_cleanup` setting). [#58267](https://github.com/ClickHouse/ClickHouse/pull/58267) ([Alexander Tokmakov](https://github.com/tavplubix)). This fixes [#57930](https://github.com/ClickHouse/ClickHouse/issues/57930). This closes [#54988](https://github.com/ClickHouse/ClickHouse/issues/54988). This closes [#54570](https://github.com/ClickHouse/ClickHouse/issues/54570). This closes [#50346](https://github.com/ClickHouse/ClickHouse/issues/50346). This closes [#47579](https://github.com/ClickHouse/ClickHouse/issues/47579). The feature has to be removed because it is not good. We have to remove it as quickly as possible, because there is no other option. [#57932](https://github.com/ClickHouse/ClickHouse/pull/57932) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### New Feature +* Implement Refreshable Materialized Views, requested in [#33919](https://github.com/ClickHouse/ClickHouse/issues/57995). [#56946](https://github.com/ClickHouse/ClickHouse/pull/56946) ([Michael Kolupaev](https://github.com/al13n321), [Michael Guzov](https://github.com/koloshmet)). +* Introduce `PASTE JOIN`, which allows users to join tables without `ON` clause simply by row numbers. Example: `SELECT * FROM (SELECT number AS a FROM numbers(2)) AS t1 PASTE JOIN (SELECT number AS a FROM numbers(2) ORDER BY a DESC) AS t2`. [#57995](https://github.com/ClickHouse/ClickHouse/pull/57995) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* The `ORDER BY` clause now supports specifying `ALL`, meaning that ClickHouse sorts by all columns in the `SELECT` clause. Example: `SELECT col1, col2 FROM tab WHERE [...] ORDER BY ALL`. [#57875](https://github.com/ClickHouse/ClickHouse/pull/57875) ([zhongyuankai](https://github.com/zhongyuankai)). +* Added a new mutation command `ALTER TABLE APPLY DELETED MASK`, which allows to enforce applying of mask written by lightweight delete and to remove rows marked as deleted from disk. [#57433](https://github.com/ClickHouse/ClickHouse/pull/57433) ([Anton Popov](https://github.com/CurtizJ)). +* A handler `/binary` opens a visual viewer of symbols inside the ClickHouse binary. [#58211](https://github.com/ClickHouse/ClickHouse/pull/58211) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Added a new SQL function `sqid` to generate Sqids (https://sqids.org/), example: `SELECT sqid(125, 126)`. [#57512](https://github.com/ClickHouse/ClickHouse/pull/57512) ([Robert Schulze](https://github.com/rschu1ze)). 
+* Add a new function `seriesPeriodDetectFFT` to detect series period using FFT. [#57574](https://github.com/ClickHouse/ClickHouse/pull/57574) ([Bhavna Jindal](https://github.com/bhavnajindal)). +* Add an HTTP endpoint for checking if Keeper is ready to accept traffic. [#55876](https://github.com/ClickHouse/ClickHouse/pull/55876) ([Konstantin Bogdanov](https://github.com/thevar1able)). +* Add 'union' mode for schema inference. In this mode the resulting table schema is the union of all files schemas (so schema is inferred from each file). The mode of schema inference is controlled by a setting `schema_inference_mode` with two possible values - `default` and `union`. Closes [#55428](https://github.com/ClickHouse/ClickHouse/issues/55428). [#55892](https://github.com/ClickHouse/ClickHouse/pull/55892) ([Kruglov Pavel](https://github.com/Avogar)). +* Add new setting `input_format_csv_try_infer_numbers_from_strings` that allows to infer numbers from strings in CSV format. Closes [#56455](https://github.com/ClickHouse/ClickHouse/issues/56455). [#56859](https://github.com/ClickHouse/ClickHouse/pull/56859) ([Kruglov Pavel](https://github.com/Avogar)). +* When the number of databases or tables exceeds a configurable threshold, show a warning to the user. [#57375](https://github.com/ClickHouse/ClickHouse/pull/57375) ([凌涛](https://github.com/lingtaolf)). +* Dictionary with `HASHED_ARRAY` (and `COMPLEX_KEY_HASHED_ARRAY`) layout supports `SHARDS` similarly to `HASHED`. [#57544](https://github.com/ClickHouse/ClickHouse/pull/57544) ([vdimir](https://github.com/vdimir)). +* Add asynchronous metrics for total primary key bytes and total allocated primary key bytes in memory. [#57551](https://github.com/ClickHouse/ClickHouse/pull/57551) ([Bharat Nallan](https://github.com/bharatnc)). +* Add `SHA512_256` function. [#57645](https://github.com/ClickHouse/ClickHouse/pull/57645) ([Bharat Nallan](https://github.com/bharatnc)). +* Add `FORMAT_BYTES` as an alias for `formatReadableSize`. [#57592](https://github.com/ClickHouse/ClickHouse/pull/57592) ([Bharat Nallan](https://github.com/bharatnc)). +* Allow passing optional session token to the `s3` table function. [#57850](https://github.com/ClickHouse/ClickHouse/pull/57850) ([Shani Elharrar](https://github.com/shanielh)). +* Introduce a new setting `http_make_head_request`. If it is turned off, the URL table engine will not do a HEAD request to determine the file size. This is needed to support inefficient, misconfigured, or not capable HTTP servers. [#54602](https://github.com/ClickHouse/ClickHouse/pull/54602) ([Fionera](https://github.com/fionera)). +* It is now possible to refer to ALIAS column in index (non-primary-key) definitions (issue [#55650](https://github.com/ClickHouse/ClickHouse/issues/55650)). Example: `CREATE TABLE tab(col UInt32, col_alias ALIAS col + 1, INDEX idx (col_alias) TYPE minmax) ENGINE = MergeTree ORDER BY col;`. [#57546](https://github.com/ClickHouse/ClickHouse/pull/57546) ([Robert Schulze](https://github.com/rschu1ze)). +* Added a new setting `readonly` which can be used to specify an S3 disk is read only. It can be useful to create a table on a disk of `s3_plain` type, while having read only access to the underlying S3 bucket. [#57977](https://github.com/ClickHouse/ClickHouse/pull/57977) ([Pengyuan Bian](https://github.com/bianpengyuan)). +* The primary key analysis in MergeTree tables will now be applied to predicates that include the virtual column `_part_offset` (optionally with `_part`). 
This feature can serve as a special kind of a secondary index. [#58224](https://github.com/ClickHouse/ClickHouse/pull/58224) ([Amos Bird](https://github.com/amosbird)). + +#### Performance Improvement +* Extract non-intersecting parts ranges from MergeTree table during FINAL processing. That way we can avoid additional FINAL logic for this non-intersecting parts ranges. In case when amount of duplicate values with same primary key is low, performance will be almost the same as without FINAL. Improve reading performance for MergeTree FINAL when `do_not_merge_across_partitions_select_final` setting is set. [#58120](https://github.com/ClickHouse/ClickHouse/pull/58120) ([Maksim Kita](https://github.com/kitaisreal)). +* Made copy between s3 disks using a s3-server-side copy instead of copying through the buffer. Improves `BACKUP/RESTORE` operations and `clickhouse-disks copy` command. [#56744](https://github.com/ClickHouse/ClickHouse/pull/56744) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* Hash JOIN respects setting `max_joined_block_size_rows` and do not produce large blocks for `ALL JOIN`. [#56996](https://github.com/ClickHouse/ClickHouse/pull/56996) ([vdimir](https://github.com/vdimir)). +* Release memory for aggregation earlier. This may avoid unnecessary external aggregation. [#57691](https://github.com/ClickHouse/ClickHouse/pull/57691) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Improve performance of string serialization. [#57717](https://github.com/ClickHouse/ClickHouse/pull/57717) ([Maksim Kita](https://github.com/kitaisreal)). +* Support trivial count optimization for `Merge`-engine tables. [#57867](https://github.com/ClickHouse/ClickHouse/pull/57867) ([skyoct](https://github.com/skyoct)). +* Optimized aggregation in some cases. [#57872](https://github.com/ClickHouse/ClickHouse/pull/57872) ([Anton Popov](https://github.com/CurtizJ)). +* The `hasAny` function can now take advantage of the full-text skipping indices. [#57878](https://github.com/ClickHouse/ClickHouse/pull/57878) ([Jpnock](https://github.com/Jpnock)). +* Function `if(cond, then, else)` (and its alias `cond ? then : else`) were optimized to use branch-free evaluation. [#57885](https://github.com/ClickHouse/ClickHouse/pull/57885) ([zhanglistar](https://github.com/zhanglistar)). +* MergeTree automatically derive `do_not_merge_across_partitions_select_final` setting if partition key expression contains only columns from primary key expression. [#58218](https://github.com/ClickHouse/ClickHouse/pull/58218) ([Maksim Kita](https://github.com/kitaisreal)). +* Speedup `MIN` and `MAX` for native types. [#58231](https://github.com/ClickHouse/ClickHouse/pull/58231) ([Raúl Marín](https://github.com/Algunenano)). +* Implement `SLRU` cache policy for filesystem cache. [#57076](https://github.com/ClickHouse/ClickHouse/pull/57076) ([Kseniia Sumarokova](https://github.com/kssenii)). +* The limit for the number of connections per endpoint for background fetches was raised from `15` to the value of `background_fetches_pool_size` setting. - MergeTree-level setting `replicated_max_parallel_fetches_for_host` became obsolete - MergeTree-level settings `replicated_fetches_http_connection_timeout`, `replicated_fetches_http_send_timeout` and `replicated_fetches_http_receive_timeout` are moved to the Server-level. - Setting `keep_alive_timeout` is added to the list of Server-level settings. [#57523](https://github.com/ClickHouse/ClickHouse/pull/57523) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). 
+* Make querying `system.filesystem_cache` not memory intensive. [#57687](https://github.com/ClickHouse/ClickHouse/pull/57687) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Reduce memory usage on strings deserialization. [#57787](https://github.com/ClickHouse/ClickHouse/pull/57787) ([Maksim Kita](https://github.com/kitaisreal)). +* More efficient constructor for Enum - it makes sense when Enum has a boatload of values. [#57887](https://github.com/ClickHouse/ClickHouse/pull/57887) ([Duc Canh Le](https://github.com/canhld94)). +* An improvement for reading from the filesystem cache: always use `pread` method. [#57970](https://github.com/ClickHouse/ClickHouse/pull/57970) ([Nikita Taranov](https://github.com/nickitat)). +* Add optimization for AND notEquals chain in logical expression optimizer. This optimization is only available with the experimental Analyzer enabled. [#58214](https://github.com/ClickHouse/ClickHouse/pull/58214) ([Kevin Mingtarja](https://github.com/kevinmingtarja)). + +#### Improvement +* Support for soft memory limit in Keeper. It will refuse requests if the memory usage is close to the maximum. [#57271](https://github.com/ClickHouse/ClickHouse/pull/57271) ([Han Fei](https://github.com/hanfei1991)). [#57699](https://github.com/ClickHouse/ClickHouse/pull/57699) ([Han Fei](https://github.com/hanfei1991)). +* Make inserts into distributed tables handle updated cluster configuration properly. When the list of cluster nodes is dynamically updated, the Directory Monitor of the distribution table will update it. [#42826](https://github.com/ClickHouse/ClickHouse/pull/42826) ([zhongyuankai](https://github.com/zhongyuankai)). +* Do not allow creating a replicated table with inconsistent merge parameters. [#56833](https://github.com/ClickHouse/ClickHouse/pull/56833) ([Duc Canh Le](https://github.com/canhld94)). +* Show uncompressed size in `system.tables`. [#56618](https://github.com/ClickHouse/ClickHouse/issues/56618). [#57186](https://github.com/ClickHouse/ClickHouse/pull/57186) ([Chen Lixiang](https://github.com/chenlx0)). +* Add `skip_unavailable_shards` as a setting for `Distributed` tables that is similar to the corresponding query-level setting. Closes [#43666](https://github.com/ClickHouse/ClickHouse/issues/43666). [#57218](https://github.com/ClickHouse/ClickHouse/pull/57218) ([Gagan Goel](https://github.com/tntnatbry)). +* The function `substring` (aliases: `substr`, `mid`) can now be used with `Enum` types. Previously, the first function argument had to be a value of type `String` or `FixedString`. This improves compatibility with 3rd party tools such as Tableau via MySQL interface. [#57277](https://github.com/ClickHouse/ClickHouse/pull/57277) ([Serge Klochkov](https://github.com/slvrtrn)). +* Function `format` now supports arbitrary argument types (instead of only `String` and `FixedString` arguments). This is important to calculate `SELECT format('The {0} to all questions is {1}', 'answer', 42)`. [#57549](https://github.com/ClickHouse/ClickHouse/pull/57549) ([Robert Schulze](https://github.com/rschu1ze)). +* Allows to use the `date_trunc` function with a case-insensitive first argument. Both cases are now supported: `SELECT date_trunc('day', now())` and `SELECT date_trunc('DAY', now())`. [#57624](https://github.com/ClickHouse/ClickHouse/pull/57624) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Better hints when a table doesn't exist. [#57342](https://github.com/ClickHouse/ClickHouse/pull/57342) ([Bharat Nallan](https://github.com/bharatnc)). 
+* Allow to overwrite `max_partition_size_to_drop` and `max_table_size_to_drop` server settings at query time. [#57452](https://github.com/ClickHouse/ClickHouse/pull/57452) ([Jordi Villar](https://github.com/jrdi)). +* Slightly better inference of unnamed tuples in JSON formats. [#57751](https://github.com/ClickHouse/ClickHouse/pull/57751) ([Kruglov Pavel](https://github.com/Avogar)). +* Add support for the read-only flag when connecting to Keeper (fixes [#53749](https://github.com/ClickHouse/ClickHouse/issues/53749)). [#57479](https://github.com/ClickHouse/ClickHouse/pull/57479) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Fix possible distributed sends getting stuck due to "No such file or directory" (during recovering a batch from disk). Fix possible issues with `error_count` from `system.distribution_queue` (in case of `distributed_directory_monitor_max_sleep_time_ms` >5min). Introduce a profile event to track async INSERT failures - `DistributedAsyncInsertionFailures`. [#57480](https://github.com/ClickHouse/ClickHouse/pull/57480) ([Azat Khuzhin](https://github.com/azat)). +* Support PostgreSQL generated columns and default column values in `MaterializedPostgreSQL` (experimental feature). Closes [#40449](https://github.com/ClickHouse/ClickHouse/issues/40449). [#57568](https://github.com/ClickHouse/ClickHouse/pull/57568) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Allow to apply some filesystem cache config settings changes without a server restart. [#57578](https://github.com/ClickHouse/ClickHouse/pull/57578) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Properly handle PostgreSQL table structures with an empty array. [#57618](https://github.com/ClickHouse/ClickHouse/pull/57618) ([Mike Kot](https://github.com/myrrc)). +* Expose the total number of errors that have occurred since the last server restart as a `ClickHouseErrorMetric_ALL` metric. [#57627](https://github.com/ClickHouse/ClickHouse/pull/57627) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Allow nodes in the configuration file with a `from_env`/`from_zk` reference and a non-empty element with replace=1. [#57628](https://github.com/ClickHouse/ClickHouse/pull/57628) ([Azat Khuzhin](https://github.com/azat)). +* Add a table function `fuzzJSON` which allows generating a lot of malformed JSON for fuzzing. [#57646](https://github.com/ClickHouse/ClickHouse/pull/57646) ([Julia Kartseva](https://github.com/jkartseva)). +* Allow IPv6 to UInt128 conversion and binary arithmetic. [#57707](https://github.com/ClickHouse/ClickHouse/pull/57707) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* Add a setting for the async inserts deduplication cache: how long we wait for the cache update. Deprecate the setting `async_block_ids_cache_min_update_interval_ms`. Now the cache is updated only in case of conflicts. [#57743](https://github.com/ClickHouse/ClickHouse/pull/57743) ([alesapin](https://github.com/alesapin)). +* The `sleep()` function can now be cancelled with `KILL QUERY`. [#57746](https://github.com/ClickHouse/ClickHouse/pull/57746) ([Vitaly Baranov](https://github.com/vitlibar)). +* Forbid `CREATE TABLE ... AS SELECT` queries for `Replicated` table engines in the experimental `Replicated` database because they are not supported. Reference [#35408](https://github.com/ClickHouse/ClickHouse/issues/35408). [#57796](https://github.com/ClickHouse/ClickHouse/pull/57796) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix and improve transforming queries for external databases, to recursively obtain all compatible predicates.
[#57888](https://github.com/ClickHouse/ClickHouse/pull/57888) ([flynn](https://github.com/ucasfl)). +* Support dynamic reloading of the filesystem cache size. Closes [#57866](https://github.com/ClickHouse/ClickHouse/issues/57866). [#57897](https://github.com/ClickHouse/ClickHouse/pull/57897) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Correctly support `system.stack_trace` for threads with blocked SIGRTMIN (these threads can exist in low-quality external libraries such as Apache rdkafka). [#57907](https://github.com/ClickHouse/ClickHouse/pull/57907) ([Azat Khuzhin](https://github.com/azat)). Also, send the signal to a thread only if it is not blocked, to avoid waiting `storage_system_stack_trace_pipe_read_timeout_ms` when it does not make any sense. [#58136](https://github.com/ClickHouse/ClickHouse/pull/58136) ([Azat Khuzhin](https://github.com/azat)). +* Tolerate keeper failures in the quorum inserts' check. [#57986](https://github.com/ClickHouse/ClickHouse/pull/57986) ([Raúl Marín](https://github.com/Algunenano)). +* Add max/peak RSS (`MemoryResidentMax`) into `system.asynchronous_metrics`. [#58095](https://github.com/ClickHouse/ClickHouse/pull/58095) ([Azat Khuzhin](https://github.com/azat)). +* Allow users to use S3-style links (`https://` and `s3://`) without specifying the region if it is not the default one. Also find the correct region if the user specified the wrong one. [#58148](https://github.com/ClickHouse/ClickHouse/pull/58148) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* `clickhouse-format --obfuscate` will know about Settings, MergeTreeSettings, and time zones and keep their names unchanged. [#58179](https://github.com/ClickHouse/ClickHouse/pull/58179) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Added an explicit `finalize()` function in `ZipArchiveWriter`. Simplify too complicated code in `ZipArchiveWriter`. This fixes [#58074](https://github.com/ClickHouse/ClickHouse/issues/58074). [#58202](https://github.com/ClickHouse/ClickHouse/pull/58202) ([Vitaly Baranov](https://github.com/vitlibar)). +* Make caches with the same path use the same cache objects. This behaviour existed before, but was broken in 23.4. If such caches with the same path have a different set of cache settings, an exception will be thrown stating that this is not allowed. [#58264](https://github.com/ClickHouse/ClickHouse/pull/58264) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Parallel replicas (experimental feature): friendly settings [#57542](https://github.com/ClickHouse/ClickHouse/pull/57542) ([Igor Nikonov](https://github.com/devcrafter)). +* Parallel replicas (experimental feature): announcement response handling improvement [#57749](https://github.com/ClickHouse/ClickHouse/pull/57749) ([Igor Nikonov](https://github.com/devcrafter)). +* Parallel replicas (experimental feature): give more respect to `min_number_of_marks` in `ParallelReplicasReadingCoordinator` [#57763](https://github.com/ClickHouse/ClickHouse/pull/57763) ([Nikita Taranov](https://github.com/nickitat)). +* Parallel replicas (experimental feature): disable parallel replicas with IN (subquery) [#58133](https://github.com/ClickHouse/ClickHouse/pull/58133) ([Igor Nikonov](https://github.com/devcrafter)). +* Parallel replicas (experimental feature): add profile event 'ParallelReplicasUsedCount' [#58173](https://github.com/ClickHouse/ClickHouse/pull/58173) ([Igor Nikonov](https://github.com/devcrafter)). +* Non-POST requests such as HEAD will be read-only, similar to GET.
[#58060](https://github.com/ClickHouse/ClickHouse/pull/58060) ([San](https://github.com/santrancisco)). +* Add `bytes_uncompressed` column to `system.part_log` [#58167](https://github.com/ClickHouse/ClickHouse/pull/58167) ([Jordi Villar](https://github.com/jrdi)). +* Add base backup name to `system.backups` and `system.backup_log` tables [#58178](https://github.com/ClickHouse/ClickHouse/pull/58178) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Add support for specifying query parameters in the command line in clickhouse-local [#58210](https://github.com/ClickHouse/ClickHouse/pull/58210) ([Pradeep Chhetri](https://github.com/chhetripradeep)). + +#### Build/Testing/Packaging Improvement +* Randomize more settings [#39663](https://github.com/ClickHouse/ClickHouse/pull/39663) ([Anton Popov](https://github.com/CurtizJ)). +* Randomize disabled optimizations in CI [#57315](https://github.com/ClickHouse/ClickHouse/pull/57315) ([Raúl Marín](https://github.com/Algunenano)). +* Allow usage of Azure-related table engines/functions on macOS. [#51866](https://github.com/ClickHouse/ClickHouse/pull/51866) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* ClickHouse Fast Test now uses Musl instead of GLibc. [#57711](https://github.com/ClickHouse/ClickHouse/pull/57711) ([Alexey Milovidov](https://github.com/alexey-milovidov)). The fully-static Musl build is available to download from the CI. +* Run ClickBench for every commit. This closes [#57708](https://github.com/ClickHouse/ClickHouse/issues/57708). [#57712](https://github.com/ClickHouse/ClickHouse/pull/57712) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove the usage of a harmful C/POSIX `select` function from external libraries. [#57467](https://github.com/ClickHouse/ClickHouse/pull/57467) ([Igor Nikonov](https://github.com/devcrafter)). +* Settings only available in ClickHouse Cloud will be also present in the open-source ClickHouse build for convenience. [#57638](https://github.com/ClickHouse/ClickHouse/pull/57638) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). + +#### Bug Fix (user-visible misbehavior in an official stable release) +* Fixed a possibility of sorting order breakage in TTL GROUP BY [#49103](https://github.com/ClickHouse/ClickHouse/pull/49103) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix: split `lttb` bucket strategy, first bucket and last bucket should only contain single point [#57003](https://github.com/ClickHouse/ClickHouse/pull/57003) ([FFish](https://github.com/wxybear)). +* Fix possible deadlock in the `Template` format during sync after error [#57004](https://github.com/ClickHouse/ClickHouse/pull/57004) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix early stop while parsing a file with skipping lots of errors [#57006](https://github.com/ClickHouse/ClickHouse/pull/57006) ([Kruglov Pavel](https://github.com/Avogar)). +* Prevent dictionary's ACL bypass via the `dictionary` table function [#57362](https://github.com/ClickHouse/ClickHouse/pull/57362) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Fix another case of a "non-ready set" error found by Fuzzer. [#57423](https://github.com/ClickHouse/ClickHouse/pull/57423) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix several issues regarding PostgreSQL `array_ndims` usage. [#57436](https://github.com/ClickHouse/ClickHouse/pull/57436) ([Ryan Jacobs](https://github.com/ryanmjacobs)). 
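For the new `bytes_uncompressed` column in `system.part_log` mentioned above, a possible inspection query might look like the sketch below; the other columns referenced already exist in `system.part_log`, but treat this as an illustration rather than a prescribed query:

```sql
-- Recent part events together with their uncompressed size.
SELECT event_time, event_type, table, part_name, bytes_uncompressed
FROM system.part_log
ORDER BY event_time DESC
LIMIT 10;
```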
+* Fix RWLock inconsistency after write lock timeout [#57454](https://github.com/ClickHouse/ClickHouse/pull/57454) ([Vitaly Baranov](https://github.com/vitlibar)). Fix RWLock inconsistency after write lock timeout (again) [#57733](https://github.com/ClickHouse/ClickHouse/pull/57733) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix: don't exclude ephemeral column when building pushing to view chain [#57461](https://github.com/ClickHouse/ClickHouse/pull/57461) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* MaterializedPostgreSQL (experimental issue): fix issue [#41922](https://github.com/ClickHouse/ClickHouse/issues/41922), add test for [#41923](https://github.com/ClickHouse/ClickHouse/issues/41923) [#57515](https://github.com/ClickHouse/ClickHouse/pull/57515) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Ignore ON CLUSTER clause in grant/revoke queries for management of replicated access entities. [#57538](https://github.com/ClickHouse/ClickHouse/pull/57538) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* Fix crash in clickhouse-local [#57553](https://github.com/ClickHouse/ClickHouse/pull/57553) ([Nikolay Degterinsky](https://github.com/evillique)). +* A fix for Hash JOIN. [#57564](https://github.com/ClickHouse/ClickHouse/pull/57564) ([vdimir](https://github.com/vdimir)). +* Fix possible error in PostgreSQL source [#57567](https://github.com/ClickHouse/ClickHouse/pull/57567) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix type correction in Hash JOIN for nested LowCardinality. [#57614](https://github.com/ClickHouse/ClickHouse/pull/57614) ([vdimir](https://github.com/vdimir)). +* Avoid hangs of `system.stack_trace` by correctly prohibiting parallel reading from it. [#57641](https://github.com/ClickHouse/ClickHouse/pull/57641) ([Azat Khuzhin](https://github.com/azat)). +* Fix an error for aggregation of sparse columns with `any(...) RESPECT NULL` [#57710](https://github.com/ClickHouse/ClickHouse/pull/57710) ([Azat Khuzhin](https://github.com/azat)). +* Fix unary operators parsing [#57713](https://github.com/ClickHouse/ClickHouse/pull/57713) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix dependency loading for the experimental table engine `MaterializedPostgreSQL`. [#57754](https://github.com/ClickHouse/ClickHouse/pull/57754) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix retries for disconnected nodes for BACKUP/RESTORE ON CLUSTER [#57764](https://github.com/ClickHouse/ClickHouse/pull/57764) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix result of external aggregation in case of partially materialized projection [#57790](https://github.com/ClickHouse/ClickHouse/pull/57790) ([Anton Popov](https://github.com/CurtizJ)). +* Fix merge in aggregation functions with `*Map` combinator [#57795](https://github.com/ClickHouse/ClickHouse/pull/57795) ([Anton Popov](https://github.com/CurtizJ)). +* Disable `system.kafka_consumers` because it has a bug. [#57822](https://github.com/ClickHouse/ClickHouse/pull/57822) ([Azat Khuzhin](https://github.com/azat)). +* Fix LowCardinality keys support in Merge JOIN. [#57827](https://github.com/ClickHouse/ClickHouse/pull/57827) ([vdimir](https://github.com/vdimir)). +* A fix for `InterpreterCreateQuery` related to the sample block. [#57855](https://github.com/ClickHouse/ClickHouse/pull/57855) ([Maksim Kita](https://github.com/kitaisreal)). +* `addresses_expr` were ignored for named collections from PostgreSQL. 
[#57874](https://github.com/ClickHouse/ClickHouse/pull/57874) ([joelynch](https://github.com/joelynch)). +* Fix invalid memory access in BLAKE3 (Rust) [#57876](https://github.com/ClickHouse/ClickHouse/pull/57876) ([Raúl Marín](https://github.com/Algunenano)). Then it was rewritten from Rust to C++ for better [memory-safety](https://www.memorysafety.org/). [#57994](https://github.com/ClickHouse/ClickHouse/pull/57994) ([Raúl Marín](https://github.com/Algunenano)). +* Normalize function names in `CREATE INDEX` [#57906](https://github.com/ClickHouse/ClickHouse/pull/57906) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix handling of unavailable replicas before first request happened [#57933](https://github.com/ClickHouse/ClickHouse/pull/57933) ([Nikita Taranov](https://github.com/nickitat)). +* Fix literal alias misclassification [#57988](https://github.com/ClickHouse/ClickHouse/pull/57988) ([Chen768959](https://github.com/Chen768959)). +* Fix invalid preprocessing on Keeper [#58069](https://github.com/ClickHouse/ClickHouse/pull/58069) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix integer overflow in the `Poco` library, related to `UTF32Encoding` [#58073](https://github.com/ClickHouse/ClickHouse/pull/58073) ([Andrey Fedotov](https://github.com/anfedotoff)). +* Fix parallel replicas (experimental feature) in presence of a scalar subquery with a big integer value [#58118](https://github.com/ClickHouse/ClickHouse/pull/58118) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix `accurateCastOrNull` for out-of-range `DateTime` [#58139](https://github.com/ClickHouse/ClickHouse/pull/58139) ([Andrey Zvonov](https://github.com/zvonand)). +* Fix possible `PARAMETER_OUT_OF_BOUND` error during subcolumns reading from a wide part in MergeTree [#58175](https://github.com/ClickHouse/ClickHouse/pull/58175) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix a slow-down of CREATE VIEW with an enormous number of subqueries [#58220](https://github.com/ClickHouse/ClickHouse/pull/58220) ([Tao Wang](https://github.com/wangtZJU)). +* Fix parallel parsing for JSONCompactEachRow [#58181](https://github.com/ClickHouse/ClickHouse/pull/58181) ([Alexey Milovidov](https://github.com/alexey-milovidov)). [#58250](https://github.com/ClickHouse/ClickHouse/pull/58250) ([Kruglov Pavel](https://github.com/Avogar)). + + +### ClickHouse release 23.11, 2023-12-06 + +#### Backward Incompatible Change +* The default ClickHouse server configuration file has enabled `access_management` (user manipulation by SQL queries) and `named_collection_control` (manipulation of named collection by SQL queries) for the `default` user by default. This closes [#56482](https://github.com/ClickHouse/ClickHouse/issues/56482). [#56619](https://github.com/ClickHouse/ClickHouse/pull/56619) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Multiple improvements for `RESPECT NULLS`/`IGNORE NULLS` for window functions. If you use them as aggregate functions and store the states of aggregate functions with these modifiers, they might become incompatible. [#57189](https://github.com/ClickHouse/ClickHouse/pull/57189) ([Raúl Marín](https://github.com/Algunenano)). +* Remove optimization `optimize_move_functions_out_of_any`. [#57190](https://github.com/ClickHouse/ClickHouse/pull/57190) ([Raúl Marín](https://github.com/Algunenano)). +* Formatters `%l`/`%k`/`%c` in function `parseDateTime` are now able to parse hours/months without leading zeros, e.g. `select parseDateTime('2023-11-26 8:14', '%F %k:%i')` now works. 
Set `parsedatetime_parse_without_leading_zeros = 0` to restore the previous behavior which required two digits. Function `formatDateTime` is now also able to print hours/months without leading zeros. This is controlled by setting `formatdatetime_format_without_leading_zeros` but off by default to not break existing use cases. [#55872](https://github.com/ClickHouse/ClickHouse/pull/55872) ([Azat Khuzhin](https://github.com/azat)). +* You can no longer use the aggregate function `avgWeighted` with arguments of type `Decimal`. Workaround: convert arguments to `Float64`. This closes [#43928](https://github.com/ClickHouse/ClickHouse/issues/43928). This closes [#31768](https://github.com/ClickHouse/ClickHouse/issues/31768). This closes [#56435](https://github.com/ClickHouse/ClickHouse/issues/56435). If you have used this function inside materialized views or projections with `Decimal` arguments, contact support@clickhouse.com. Fixed error in aggregate function `sumMap` and made it slower around 1.5..2 times. It does not matter because the function is garbage anyway. This closes [#54955](https://github.com/ClickHouse/ClickHouse/issues/54955). This closes [#53134](https://github.com/ClickHouse/ClickHouse/issues/53134). This closes [#55148](https://github.com/ClickHouse/ClickHouse/issues/55148). Fix a bug in function `groupArraySample` - it used the same random seed in case more than one aggregate state is generated in a query. [#56350](https://github.com/ClickHouse/ClickHouse/pull/56350) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### New Feature +* Added server setting `async_load_databases` for asynchronous loading of databases and tables. Speeds up the server start time. Applies to databases with `Ordinary`, `Atomic` and `Replicated` engines. Their tables load metadata asynchronously. Query to a table increases the priority of the load job and waits for it to be done. Added a new table `system.asynchronous_loader` for introspection. [#49351](https://github.com/ClickHouse/ClickHouse/pull/49351) ([Sergei Trifonov](https://github.com/serxa)). +* Add system table `blob_storage_log`. It allows auditing all the data written to S3 and other object storages. [#52918](https://github.com/ClickHouse/ClickHouse/pull/52918) ([vdimir](https://github.com/vdimir)). +* Use statistics to order prewhere conditions better. [#53240](https://github.com/ClickHouse/ClickHouse/pull/53240) ([Han Fei](https://github.com/hanfei1991)). +* Added support for compression in the Keeper's protocol. It can be enabled on the ClickHouse side by using this flag `use_compression` inside `zookeeper` section. Keep in mind that only ClickHouse Keeper supports compression, while Apache ZooKeeper does not. Resolves [#49507](https://github.com/ClickHouse/ClickHouse/issues/49507). [#54957](https://github.com/ClickHouse/ClickHouse/pull/54957) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Introduce the feature `storage_metadata_write_full_object_key`. If it is set as `true` then metadata files are written with the new format. With that format ClickHouse stores full remote object key in the metadata file which allows better flexibility and optimization. [#55566](https://github.com/ClickHouse/ClickHouse/pull/55566) ([Sema Checherinda](https://github.com/CheSema)). +* Add new settings and syntax to protect named collections' fields from being overridden. This is meant to prevent a malicious user from obtaining unauthorized access to secrets. 
[#55782](https://github.com/ClickHouse/ClickHouse/pull/55782) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Add `hostname` column to all system log tables - it is useful if you make the system tables replicated, shared, or distributed. [#55894](https://github.com/ClickHouse/ClickHouse/pull/55894) ([Bharat Nallan](https://github.com/bharatnc)). +* Add `CHECK ALL TABLES` query. [#56022](https://github.com/ClickHouse/ClickHouse/pull/56022) ([vdimir](https://github.com/vdimir)). +* Added function `fromDaysSinceYearZero` which is similar to MySQL's `FROM_DAYS`. E.g. `SELECT fromDaysSinceYearZero(739136)` returns `2023-09-08`. [#56088](https://github.com/ClickHouse/ClickHouse/pull/56088) ([Joanna Hulboj](https://github.com/jh0x)). +* Add an external Python tool to view backups and to extract information from them without using ClickHouse. [#56268](https://github.com/ClickHouse/ClickHouse/pull/56268) ([Vitaly Baranov](https://github.com/vitlibar)). +* Implement a new setting called `preferred_optimize_projection_name`. If it is set to a non-empty string, the specified projection would be used if possible instead of choosing from all the candidates. [#56309](https://github.com/ClickHouse/ClickHouse/pull/56309) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Add 4-letter command for yielding/resigning leadership (https://github.com/ClickHouse/ClickHouse/issues/56352). [#56354](https://github.com/ClickHouse/ClickHouse/pull/56354) ([Pradeep Chhetri](https://github.com/chhetripradeep)). [#56620](https://github.com/ClickHouse/ClickHouse/pull/56620) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Added a new SQL function, `arrayRandomSample(arr, k)` which returns a sample of k elements from the input array. Similar functionality could previously be achieved only with less convenient syntax, e.g. `SELECT arrayReduce('groupArraySample(3)', range(10))`. [#56416](https://github.com/ClickHouse/ClickHouse/pull/56416) ([Robert Schulze](https://github.com/rschu1ze)). +* Added support for `Float16` type data to use in `.npy` files. Closes [#56344](https://github.com/ClickHouse/ClickHouse/issues/56344). [#56424](https://github.com/ClickHouse/ClickHouse/pull/56424) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Added a system view `information_schema.statistics` for better compatibility with Tableau Online. [#56425](https://github.com/ClickHouse/ClickHouse/pull/56425) ([Serge Klochkov](https://github.com/slvrtrn)). +* Add `system.symbols` table useful for introspection of the binary. [#56548](https://github.com/ClickHouse/ClickHouse/pull/56548) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Configurable dashboards. Queries for charts are now loaded using a query, which by default uses a new `system.dashboards` table. [#56771](https://github.com/ClickHouse/ClickHouse/pull/56771) ([Sergei Trifonov](https://github.com/serxa)). +* Introduce `fileCluster` table function - it is useful if you mount a shared filesystem (NFS and similar) into the `user_files` directory. [#56868](https://github.com/ClickHouse/ClickHouse/pull/56868) ([Andrey Zvonov](https://github.com/zvonand)). +* Add `_size` virtual column with file size in bytes to `s3/file/hdfs/url/azureBlobStorage` engines. [#57126](https://github.com/ClickHouse/ClickHouse/pull/57126) ([Kruglov Pavel](https://github.com/Avogar)). +* Expose the number of errors for each error code occurred on a server since last restart from the Prometheus endpoint. 
[#57209](https://github.com/ClickHouse/ClickHouse/pull/57209) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* ClickHouse Keeper reports its running availability zone at the `/keeper/availability-zone` path. The zone (for example, `us-west-1a`) can be configured in the Keeper configuration. [#56715](https://github.com/ClickHouse/ClickHouse/pull/56715) ([Jianfei Hu](https://github.com/incfly)). +* Make `ALTER TABLE ... MODIFY QUERY` for materialized views non-experimental and deprecate the `allow_experimental_alter_materialized_view_structure` setting. Fixes [#15206](https://github.com/ClickHouse/ClickHouse/issues/15206). [#57311](https://github.com/ClickHouse/ClickHouse/pull/57311) ([alesapin](https://github.com/alesapin)). +* Setting `join_algorithm` respects the specified order of algorithms. [#51745](https://github.com/ClickHouse/ClickHouse/pull/51745) ([vdimir](https://github.com/vdimir)). +* Add support for the [well-known Protobuf types](https://protobuf.dev/reference/protobuf/google.protobuf/) in the Protobuf format. [#56741](https://github.com/ClickHouse/ClickHouse/pull/56741) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)). + +#### Performance Improvement +* Adaptive timeouts for interacting with S3. The first attempt is made with low send and receive timeouts. [#56314](https://github.com/ClickHouse/ClickHouse/pull/56314) ([Sema Checherinda](https://github.com/CheSema)). +* Increase the default value of `max_concurrent_queries` from 100 to 1000. This makes sense when there is a large number of connecting clients, which are slowly sending or receiving data, so the server is not limited by CPU, or when the number of CPU cores is larger than 100. Also, enable the concurrency control by default, and set the desired number of query processing threads in total as twice the number of CPU cores. It improves performance in scenarios with a very large number of concurrent queries. [#46927](https://github.com/ClickHouse/ClickHouse/pull/46927) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Support parallel evaluation of window functions. Fixes [#34688](https://github.com/ClickHouse/ClickHouse/issues/34688). [#39631](https://github.com/ClickHouse/ClickHouse/pull/39631) ([Dmitry Novik](https://github.com/novikd)). +* `Numbers` table engine (of the `system.numbers` table) now analyzes the condition to generate the needed subset of data, like a table's index. [#50909](https://github.com/ClickHouse/ClickHouse/pull/50909) ([JackyWoo](https://github.com/JackyWoo)). +* Improved the performance of filtering by `IN (...)` condition for the `Merge` table engine. [#54905](https://github.com/ClickHouse/ClickHouse/pull/54905) ([Nikita Taranov](https://github.com/nickitat)). +* An improvement which takes place when the filesystem cache is full and there are big reads. [#55158](https://github.com/ClickHouse/ClickHouse/pull/55158) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Add the ability to disable checksums for S3 to avoid an excessive pass over the file (this is controlled by the setting `s3_disable_checksum`). [#55559](https://github.com/ClickHouse/ClickHouse/pull/55559) ([Azat Khuzhin](https://github.com/azat)). +* Now we read synchronously from remote tables when data is in the page cache (like we do for local tables). It is faster, doesn't require synchronisation inside the thread pool, doesn't hesitate to do `seek`-s on the local FS, and reduces CPU wait. [#55841](https://github.com/ClickHouse/ClickHouse/pull/55841) ([Nikita Taranov](https://github.com/nickitat)). +* Optimization for getting values from `map` and `arrayElement`.
It brings about a 30% speedup by reducing the reserved memory and the number of `resize` calls. [#55957](https://github.com/ClickHouse/ClickHouse/pull/55957) ([lgbo](https://github.com/lgbo-ustc)). +* Optimization of multi-stage filtering with AVX-512. Performance experiments with the OnTime dataset on an ICX device (Intel Xeon Platinum 8380 CPU, 80 cores, 160 threads) show that this change could bring improvements of 7.4%, 5.9%, 4.7%, 3.0%, and 4.6% to the QPS of queries Q2, Q3, Q4, Q5 and Q6 respectively, while having no impact on others. [#56079](https://github.com/ClickHouse/ClickHouse/pull/56079) ([Zhiguo Zhou](https://github.com/ZhiguoZh)). +* Limit the number of threads busy inside the query profiler. If there are more, they will skip profiling. [#56105](https://github.com/ClickHouse/ClickHouse/pull/56105) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Decrease the number of virtual function calls in window functions. [#56120](https://github.com/ClickHouse/ClickHouse/pull/56120) ([Maksim Kita](https://github.com/kitaisreal)). +* Allow recursive Tuple field pruning in the ORC data format to speed up scanning. [#56122](https://github.com/ClickHouse/ClickHouse/pull/56122) ([李扬](https://github.com/taiyang-li)). +* Trivial count optimization for the `Npy` data format: queries like `select count() from 'data.npy'` will work much faster thanks to caching of the results. [#56304](https://github.com/ClickHouse/ClickHouse/pull/56304) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Queries with aggregation and a large number of streams will use less memory during the query plan's construction. [#57074](https://github.com/ClickHouse/ClickHouse/pull/57074) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Improve performance of executing queries for use cases with many users and highly concurrent queries (>2000 QPS) by optimizing the access to ProcessList. [#57106](https://github.com/ClickHouse/ClickHouse/pull/57106) ([Andrej Hoos](https://github.com/adikus)). +* Trivial improvement of array join: reuse some intermediate results. [#57183](https://github.com/ClickHouse/ClickHouse/pull/57183) ([李扬](https://github.com/taiyang-li)). +* There are cases when stack unwinding was slow. Not anymore. [#57221](https://github.com/ClickHouse/ClickHouse/pull/57221) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Now we use the default read pool for reading from external storage when `max_streams = 1`. It is beneficial when read prefetches are enabled. [#57334](https://github.com/ClickHouse/ClickHouse/pull/57334) ([Nikita Taranov](https://github.com/nickitat)). +* Keeper improvement: improve memory usage during startup by delaying log preprocessing. [#55660](https://github.com/ClickHouse/ClickHouse/pull/55660) ([Antonio Andelic](https://github.com/antonio2368)). +* Improved performance of glob matching for `File` and `HDFS` storages. [#56141](https://github.com/ClickHouse/ClickHouse/pull/56141) ([Andrey Zvonov](https://github.com/zvonand)). +* Posting lists in experimental full text indexes are now compressed, which reduces their size by 10-30%. [#56226](https://github.com/ClickHouse/ClickHouse/pull/56226) ([Harry Lee](https://github.com/HarryLeeIBM)). +* Parallelise `BackupEntriesCollector` in backups. [#56312](https://github.com/ClickHouse/ClickHouse/pull/56312) ([Kseniia Sumarokova](https://github.com/kssenii)). + +#### Improvement +* Add a new `MergeTree` setting `add_implicit_sign_column_constraint_for_collapsing_engine` (disabled by default).
When enabled, it adds an implicit CHECK constraint for `CollapsingMergeTree` tables that restricts the value of the `Sign` column to be only -1 or 1. [#56701](https://github.com/ClickHouse/ClickHouse/issues/56701). [#56986](https://github.com/ClickHouse/ClickHouse/pull/56986) ([Kevin Mingtarja](https://github.com/kevinmingtarja)). +* Enable adding a new disk to the storage configuration without a restart. [#56367](https://github.com/ClickHouse/ClickHouse/pull/56367) ([Duc Canh Le](https://github.com/canhld94)). +* Support creating and materializing an index in the same ALTER query; also support "modify TTL" and "materialize TTL" in the same query. Closes [#55651](https://github.com/ClickHouse/ClickHouse/issues/55651). [#56331](https://github.com/ClickHouse/ClickHouse/pull/56331) ([flynn](https://github.com/ucasfl)). +* Add a new table function named `fuzzJSON` with rows containing perturbed versions of the source JSON string with random variations. [#56490](https://github.com/ClickHouse/ClickHouse/pull/56490) ([Julia Kartseva](https://github.com/jkartseva)). +* Engine `Merge` filters the records according to the row policies of the underlying tables, so you don't have to create another row policy on a `Merge` table. [#50209](https://github.com/ClickHouse/ClickHouse/pull/50209) ([Ilya Golshtein](https://github.com/ilejn)). +* Add a setting `max_execution_time_leaf` to limit the execution time on shards for distributed queries, and `timeout_overflow_mode_leaf` to control the behaviour if the timeout happens. [#51823](https://github.com/ClickHouse/ClickHouse/pull/51823) ([Duc Canh Le](https://github.com/canhld94)). +* Add a ClickHouse setting to disable tunneling for HTTPS requests over an HTTP proxy. [#55033](https://github.com/ClickHouse/ClickHouse/pull/55033) ([Arthur Passos](https://github.com/arthurpassos)). +* Set `background_fetches_pool_size` to 16 and `background_schedule_pool_size` to 512, which is better for production usage with frequent small insertions. [#54327](https://github.com/ClickHouse/ClickHouse/pull/54327) ([Denny Crane](https://github.com/den-crane)). +* Previously, when reading data from a CSV file whose line ends with `\r` not followed by `\n`, ClickHouse threw the exception `Cannot parse CSV format: found \r (CR) not followed by \n (LF). Line must end by \n (LF) or \r\n (CR LF) or \n\r.` In ClickHouse, a CSV line must end with `\n`, `\r\n` or `\n\r`, so a `\r` must be followed by `\n`; however, in some situations the CSV input data is abnormal and `\r` appears at the end of a line. Such input can now be handled. [#54340](https://github.com/ClickHouse/ClickHouse/pull/54340) ([KevinyhZou](https://github.com/KevinyhZou)). +* Update the Arrow library to release-13.0.0, which supports new encodings. Closes [#44505](https://github.com/ClickHouse/ClickHouse/issues/44505). [#54800](https://github.com/ClickHouse/ClickHouse/pull/54800) ([Kruglov Pavel](https://github.com/Avogar)). +* Improve performance of ON CLUSTER queries by removing heavy system calls to get all network interfaces when looking for the local IP address in the DDL entry hosts list. [#54909](https://github.com/ClickHouse/ClickHouse/pull/54909) ([Duc Canh Le](https://github.com/canhld94)). +* Fixed accounting of memory allocated before attaching a thread to a query or a user. [#56089](https://github.com/ClickHouse/ClickHouse/pull/56089) ([Nikita Taranov](https://github.com/nickitat)). +* Add support for `LARGE_LIST` in Apache Arrow formats. [#56118](https://github.com/ClickHouse/ClickHouse/pull/56118) ([edef](https://github.com/edef1c)).
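A sketch of the new `add_implicit_sign_column_constraint_for_collapsing_engine` setting described at the start of this group; the table definition and column names are made up for illustration:

```sql
CREATE TABLE page_visits
(
    page_id UInt64,
    visits  UInt32,
    Sign    Int8
)
ENGINE = CollapsingMergeTree(Sign)
ORDER BY page_id
SETTINGS add_implicit_sign_column_constraint_for_collapsing_engine = 1;

-- With the setting enabled, the implicit CHECK constraint rejects inserts
-- where Sign is anything other than -1 or 1.
```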
+* Allow manual compaction of `EmbeddedRocksDB` via `OPTIMIZE` query. [#56225](https://github.com/ClickHouse/ClickHouse/pull/56225) ([Azat Khuzhin](https://github.com/azat)). +* Add ability to specify BlockBasedTableOptions for `EmbeddedRocksDB` tables. [#56264](https://github.com/ClickHouse/ClickHouse/pull/56264) ([Azat Khuzhin](https://github.com/azat)). +* `SHOW COLUMNS` now displays MySQL's equivalent data type name when the connection was made through the MySQL protocol. Previously, this was the case when setting `use_mysql_types_in_show_columns = 1`. The setting is retained but made obsolete. [#56277](https://github.com/ClickHouse/ClickHouse/pull/56277) ([Robert Schulze](https://github.com/rschu1ze)). +* Fixed possible `The local set of parts of table doesn't look like the set of parts in ZooKeeper` error if server was restarted just after `TRUNCATE` or `DROP PARTITION`. [#56282](https://github.com/ClickHouse/ClickHouse/pull/56282) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fixed handling of non-const query strings in functions `formatQuery`/ `formatQuerySingleLine`. Also added `OrNull` variants of both functions that return a NULL when a query cannot be parsed instead of throwing an exception. [#56327](https://github.com/ClickHouse/ClickHouse/pull/56327) ([Robert Schulze](https://github.com/rschu1ze)). +* Allow backup of materialized view with dropped inner table instead of failing the backup. [#56387](https://github.com/ClickHouse/ClickHouse/pull/56387) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Queries to `system.replicas` initiate requests to ZooKeeper when certain columns are queried. When there are thousands of tables these requests might produce a considerable load on ZooKeeper. If there are multiple simultaneous queries to `system.replicas` they do same requests multiple times. The change is to "deduplicate" requests from concurrent queries. [#56420](https://github.com/ClickHouse/ClickHouse/pull/56420) ([Alexander Gololobov](https://github.com/davenger)). +* Fix translation to MySQL compatible query for querying external databases. [#56456](https://github.com/ClickHouse/ClickHouse/pull/56456) ([flynn](https://github.com/ucasfl)). +* Add support for backing up and restoring tables using `KeeperMap` engine. [#56460](https://github.com/ClickHouse/ClickHouse/pull/56460) ([Antonio Andelic](https://github.com/antonio2368)). +* 404 response for CompleteMultipartUpload has to be rechecked. Operation could be done on server even if client got timeout or other network errors. The next retry of CompleteMultipartUpload receives 404 response. If the object key exists that operation is considered as successful. [#56475](https://github.com/ClickHouse/ClickHouse/pull/56475) ([Sema Checherinda](https://github.com/CheSema)). +* Enable the HTTP OPTIONS method by default - it simplifies requesting ClickHouse from a web browser. [#56483](https://github.com/ClickHouse/ClickHouse/pull/56483) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* The value for `dns_max_consecutive_failures` was changed by mistake in [#46550](https://github.com/ClickHouse/ClickHouse/issues/46550) - this is reverted and adjusted to a better value. Also, increased the HTTP keep-alive timeout to a reasonable value from production. [#56485](https://github.com/ClickHouse/ClickHouse/pull/56485) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Load base backups lazily (a base backup won't be loaded until it's needed). Also add some log message and profile events for backups. 
[#56516](https://github.com/ClickHouse/ClickHouse/pull/56516) ([Vitaly Baranov](https://github.com/vitlibar)). +* Setting `query_cache_store_results_of_queries_with_nondeterministic_functions` (with values `false` or `true`) was marked obsolete. It was replaced by setting `query_cache_nondeterministic_function_handling`, a three-valued enum that controls how the query cache handles queries with non-deterministic functions: a) throw an exception (default behavior), b) save the non-deterministic query result regardless, or c) ignore, i.e. don't throw an exception and don't cache the result. [#56519](https://github.com/ClickHouse/ClickHouse/pull/56519) ([Robert Schulze](https://github.com/rschu1ze)). +* Rewrite equality with `is null` check in the JOIN ON section. Experimental *Analyzer only*. [#56538](https://github.com/ClickHouse/ClickHouse/pull/56538) ([vdimir](https://github.com/vdimir)). +* Function `concat` now supports arbitrary argument types (instead of only String and FixedString arguments). This makes it behave more similarly to MySQL's `concat` implementation. For example, `SELECT concat('ab', 42)` now returns `ab42`. [#56540](https://github.com/ClickHouse/ClickHouse/pull/56540) ([Serge Klochkov](https://github.com/slvrtrn)). +* Allow getting cache configuration from the 'named_collection' section in the config or from SQL-created named collections. [#56541](https://github.com/ClickHouse/ClickHouse/pull/56541) ([Kseniia Sumarokova](https://github.com/kssenii)). +* PostgreSQL database engine: make the removal of outdated tables less aggressive when the PostgreSQL connection is unsuccessful. [#56609](https://github.com/ClickHouse/ClickHouse/pull/56609) ([jsc0218](https://github.com/jsc0218)). +* Fixed an issue where connecting to PostgreSQL took too much time when the URL was not right, causing the relevant query to get stuck there until it was cancelled. [#56648](https://github.com/ClickHouse/ClickHouse/pull/56648) ([jsc0218](https://github.com/jsc0218)). +* Keeper improvement: disable compressed logs by default in Keeper. [#56763](https://github.com/ClickHouse/ClickHouse/pull/56763) ([Antonio Andelic](https://github.com/antonio2368)). +* Add config setting `wait_dictionaries_load_at_startup`. [#56782](https://github.com/ClickHouse/ClickHouse/pull/56782) ([Vitaly Baranov](https://github.com/vitlibar)). +* There was a potential vulnerability in previous ClickHouse versions: if a user has connected and unsuccessfully tried to authenticate with the "interserver secret" method, the server didn't terminate the connection immediately but continued to receive and ignore the leftover packets from the client. While these packets are ignored, they are still parsed, and if they use a compression method with another known vulnerability, it will lead to exploitation of it without authentication. This issue was found with [ClickHouse Bug Bounty Program](https://github.com/ClickHouse/ClickHouse/issues/38986) by https://twitter.com/malacupa. [#56794](https://github.com/ClickHouse/ClickHouse/pull/56794) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fetching a part now waits until that part is fully committed on the remote replica. It is better not to send a part in the PreActive state. In case of zero-copy replication this is a mandatory restriction. [#56808](https://github.com/ClickHouse/ClickHouse/pull/56808) ([Sema Checherinda](https://github.com/CheSema)). +* Fix a possible PostgreSQL logical replication conversion error when using the experimental `MaterializedPostgreSQL`. [#53721](https://github.com/ClickHouse/ClickHouse/pull/53721) ([takakawa](https://github.com/takakawa)).
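Illustrating the `concat` change above; the example call and its result are taken directly from the entry:

```sql
-- concat() now accepts non-string arguments and converts them to text.
SELECT concat('ab', 42);  -- 'ab42'
```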
+* Implement user-level setting `alter_move_to_space_execute_async` which allows executing `ALTER TABLE ... MOVE PARTITION|PART TO DISK|VOLUME` queries asynchronously. The size of the pool for background executions is controlled by `background_move_pool_size`. The default behavior is synchronous execution. Fixes [#47643](https://github.com/ClickHouse/ClickHouse/issues/47643). [#56809](https://github.com/ClickHouse/ClickHouse/pull/56809) ([alesapin](https://github.com/alesapin)). +* Allow filtering by engine when scanning `system.tables`, avoiding unnecessary (potentially time-consuming) connections. [#56813](https://github.com/ClickHouse/ClickHouse/pull/56813) ([jsc0218](https://github.com/jsc0218)). +* Show `total_bytes` and `total_rows` in system tables for RocksDB storage. [#56816](https://github.com/ClickHouse/ClickHouse/pull/56816) ([Aleksandr Musorin](https://github.com/AVMusorin)). +* Allow basic commands in ALTER for TEMPORARY tables. [#56892](https://github.com/ClickHouse/ClickHouse/pull/56892) ([Sergey](https://github.com/icuken)). +* LZ4 compression: buffer the compressed block in a rare case when the output buffer capacity is not enough to write the compressed block directly into it. [#56938](https://github.com/ClickHouse/ClickHouse/pull/56938) ([Sema Checherinda](https://github.com/CheSema)). +* Add metrics for the number of queued jobs, which is useful for the IO thread pool. [#56958](https://github.com/ClickHouse/ClickHouse/pull/56958) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add a setting for the PostgreSQL table engine in the config file. Added a check for the setting and documentation around it. [#56959](https://github.com/ClickHouse/ClickHouse/pull/56959) ([Peignon Melvyn](https://github.com/melvynator)). +* Function `concat` can now be called with a single argument, e.g., `SELECT concat('abc')`. This makes its behavior more consistent with MySQL's concat implementation. [#57000](https://github.com/ClickHouse/ClickHouse/pull/57000) ([Serge Klochkov](https://github.com/slvrtrn)). +* Sign all `x-amz-*` headers as required by the AWS S3 docs. [#57001](https://github.com/ClickHouse/ClickHouse/pull/57001) ([Arthur Passos](https://github.com/arthurpassos)). +* Function `fromDaysSinceYearZero` (alias: `FROM_DAYS`) can now be used with unsigned and signed integer types (previously, it had to be an unsigned integer). This improves compatibility with 3rd party tools such as Tableau Online. [#57002](https://github.com/ClickHouse/ClickHouse/pull/57002) ([Serge Klochkov](https://github.com/slvrtrn)). +* Add `system.s3queue_log` to the default config. [#57036](https://github.com/ClickHouse/ClickHouse/pull/57036) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Change the default for `wait_dictionaries_load_at_startup` to true, and use this setting only if `dictionaries_lazy_load` is false. [#57133](https://github.com/ClickHouse/ClickHouse/pull/57133) ([Vitaly Baranov](https://github.com/vitlibar)). +* Check the dictionary source type on creation even if `dictionaries_lazy_load` is enabled. [#57134](https://github.com/ClickHouse/ClickHouse/pull/57134) ([Vitaly Baranov](https://github.com/vitlibar)). +* Plan-level optimizations can now be enabled/disabled individually. Previously, it was only possible to disable them all. The setting which previously did that (`query_plan_enable_optimizations`) is retained and can still be used to disable all optimizations.
[#57152](https://github.com/ClickHouse/ClickHouse/pull/57152) ([Robert Schulze](https://github.com/rschu1ze)). +* The server's exit code will correspond to the exception code. For example, if the server cannot start due to memory limit, it will exit with the code 241 = MEMORY_LIMIT_EXCEEDED. In previous versions, the exit code for exceptions was always 70 = Poco::Util::ExitCode::EXIT_SOFTWARE. [#57153](https://github.com/ClickHouse/ClickHouse/pull/57153) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Do not demangle and symbolize stack frames from `functional` C++ header. [#57201](https://github.com/ClickHouse/ClickHouse/pull/57201) ([Mike Kot](https://github.com/myrrc)). +* HTTP server page `/dashboard` now supports charts with multiple lines. [#57236](https://github.com/ClickHouse/ClickHouse/pull/57236) ([Sergei Trifonov](https://github.com/serxa)). +* The `max_memory_usage_in_client` command line option supports a string value with a suffix (K, M, G, etc). Closes [#56879](https://github.com/ClickHouse/ClickHouse/issues/56879). [#57273](https://github.com/ClickHouse/ClickHouse/pull/57273) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Bumped Intel QPL (used by codec `DEFLATE_QPL`) from v1.2.0 to v1.3.1 . Also fixed a bug in case of BOF (Block On Fault) = 0, changed to handle page faults by falling back to SW path. [#57291](https://github.com/ClickHouse/ClickHouse/pull/57291) ([jasperzhu](https://github.com/jinjunzh)). +* Increase default `replicated_deduplication_window` of MergeTree settings from 100 to 1k. [#57335](https://github.com/ClickHouse/ClickHouse/pull/57335) ([sichenzhao](https://github.com/sichenzhao)). +* Stop using `INCONSISTENT_METADATA_FOR_BACKUP` that much. If possible prefer to continue scanning instead of stopping and starting the scanning for backup from the beginning. [#57385](https://github.com/ClickHouse/ClickHouse/pull/57385) ([Vitaly Baranov](https://github.com/vitlibar)). + +#### Build/Testing/Packaging Improvement +* Add SQLLogic test. [#56078](https://github.com/ClickHouse/ClickHouse/pull/56078) ([Han Fei](https://github.com/hanfei1991)). +* Make `clickhouse-local` and `clickhouse-client` available under short names (`ch`, `chl`, `chc`) for usability. [#56634](https://github.com/ClickHouse/ClickHouse/pull/56634) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Optimized build size further by removing unused code from external libraries. [#56786](https://github.com/ClickHouse/ClickHouse/pull/56786) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add automatic check that there are no large translation units. [#56559](https://github.com/ClickHouse/ClickHouse/pull/56559) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Lower the size of the single-binary distribution. This closes [#55181](https://github.com/ClickHouse/ClickHouse/issues/55181). [#56617](https://github.com/ClickHouse/ClickHouse/pull/56617) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Information about the sizes of every translation unit and binary file after each build will be sent to the CI database in ClickHouse Cloud. This closes [#56107](https://github.com/ClickHouse/ClickHouse/issues/56107). [#56636](https://github.com/ClickHouse/ClickHouse/pull/56636) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Certain files of "Apache Arrow" library (which we use only for non-essential things like parsing the arrow format) were rebuilt all the time regardless of the build cache. This is fixed. 
[#56657](https://github.com/ClickHouse/ClickHouse/pull/56657) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Avoid recompiling translation units that depend on the autogenerated source file with the version. [#56660](https://github.com/ClickHouse/ClickHouse/pull/56660) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Tracing data of the linker invocations will be sent to the CI database in ClickHouse Cloud. [#56725](https://github.com/ClickHouse/ClickHouse/pull/56725) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Use DWARF 5 debug symbols for the clickhouse binary (was DWARF 4 previously). [#56770](https://github.com/ClickHouse/ClickHouse/pull/56770) ([Michael Kolupaev](https://github.com/al13n321)). +* Add a new build option `SANITIZE_COVERAGE`. If it is enabled, the code is instrumented to track the coverage. The collected information is available inside ClickHouse with: (1) a new function `coverage` that returns an array of unique addresses in the code found after the previous coverage reset; (2) `SYSTEM RESET COVERAGE` query that resets the accumulated data. This allows us to compare the coverage of different tests, including differential code coverage. Continuation of [#20539](https://github.com/ClickHouse/ClickHouse/issues/20539). [#56102](https://github.com/ClickHouse/ClickHouse/pull/56102) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Some of the stack frames might not be resolved when collecting stacks. In such cases the raw address might be helpful. [#56267](https://github.com/ClickHouse/ClickHouse/pull/56267) ([Alexander Gololobov](https://github.com/davenger)). +* Add an option to disable `libssh`. [#56333](https://github.com/ClickHouse/ClickHouse/pull/56333) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Enable `temporary_data_in_cache` in S3 tests in CI. [#48425](https://github.com/ClickHouse/ClickHouse/pull/48425) ([vdimir](https://github.com/vdimir)). +* Set the max memory usage for clickhouse-client (`1G`) in the CI. [#56873](https://github.com/ClickHouse/ClickHouse/pull/56873) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). + +#### Bug Fix (user-visible misbehavior in an official stable release) +* Fix experimental Analyzer: insertion from SELECT with a subquery referencing the insertion table should process only the insertion block. [#50857](https://github.com/ClickHouse/ClickHouse/pull/50857) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* Fix a bug in the `str_to_map` function. [#56423](https://github.com/ClickHouse/ClickHouse/pull/56423) ([Arthur Passos](https://github.com/arthurpassos)). +* Keeper `reconfig`: add timeout before yielding/taking leadership [#53481](https://github.com/ClickHouse/ClickHouse/pull/53481) ([Mike Kot](https://github.com/myrrc)). +* Fix incorrect header in grace hash join and filter pushdown [#53922](https://github.com/ClickHouse/ClickHouse/pull/53922) ([vdimir](https://github.com/vdimir)). +* Fix selecting from system tables when the table is based on a table function. [#55540](https://github.com/ClickHouse/ClickHouse/pull/55540) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* RFC: Fix "Cannot find column X in source stream" for Distributed queries with LIMIT BY [#55836](https://github.com/ClickHouse/ClickHouse/pull/55836) ([Azat Khuzhin](https://github.com/azat)). +* Fix 'Cannot read from file:' while running client in a background [#55976](https://github.com/ClickHouse/ClickHouse/pull/55976) ([Kruglov Pavel](https://github.com/Avogar)).
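For the `SANITIZE_COVERAGE` build option described in the build section above, the introspection could be used roughly as follows; this is only meaningful in a binary built with that option, and is a sketch rather than an exact recipe:

```sql
-- Reset the accumulated coverage data, run something, then inspect coverage.
SYSTEM RESET COVERAGE;
SELECT 1;
SELECT length(coverage()) AS unique_addresses_hit;
```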
+* Fix clickhouse-local exit on bad send_logs_level setting [#55994](https://github.com/ClickHouse/ClickHouse/pull/55994) ([Kruglov Pavel](https://github.com/Avogar)). +* Bug fix explain ast with parameterized view [#56004](https://github.com/ClickHouse/ClickHouse/pull/56004) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Fix a crash during table loading on startup [#56232](https://github.com/ClickHouse/ClickHouse/pull/56232) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ClickHouse-sourced dictionaries with an explicit query [#56236](https://github.com/ClickHouse/ClickHouse/pull/56236) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix segfault in signal handler for Keeper [#56266](https://github.com/ClickHouse/ClickHouse/pull/56266) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix incomplete query result for UNION in view() function. [#56274](https://github.com/ClickHouse/ClickHouse/pull/56274) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix inconsistency of "cast('0' as DateTime64(3))" and "cast('0' as Nullable(DateTime64(3)))" [#56286](https://github.com/ClickHouse/ClickHouse/pull/56286) ([李扬](https://github.com/taiyang-li)). +* Fix rare race condition related to Memory allocation failure [#56303](https://github.com/ClickHouse/ClickHouse/pull/56303) ([alesapin](https://github.com/alesapin)). +* Fix restore from backup with `flatten_nested` and `data_type_default_nullable` [#56306](https://github.com/ClickHouse/ClickHouse/pull/56306) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix crash in case of adding a column with type Object(JSON) [#56307](https://github.com/ClickHouse/ClickHouse/pull/56307) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix crash in filterPushDown [#56380](https://github.com/ClickHouse/ClickHouse/pull/56380) ([vdimir](https://github.com/vdimir)). +* Fix restore from backup with mat view and dropped source table [#56383](https://github.com/ClickHouse/ClickHouse/pull/56383) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix segfault during Kerberos initialization [#56401](https://github.com/ClickHouse/ClickHouse/pull/56401) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix buffer overflow in T64 [#56434](https://github.com/ClickHouse/ClickHouse/pull/56434) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix nullable primary key in final (2) [#56452](https://github.com/ClickHouse/ClickHouse/pull/56452) ([Amos Bird](https://github.com/amosbird)). +* Fix ON CLUSTER queries without database on initial node [#56484](https://github.com/ClickHouse/ClickHouse/pull/56484) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix startup failure due to TTL dependency [#56489](https://github.com/ClickHouse/ClickHouse/pull/56489) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ALTER COMMENT queries ON CLUSTER [#56491](https://github.com/ClickHouse/ClickHouse/pull/56491) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ALTER COLUMN with ALIAS [#56493](https://github.com/ClickHouse/ClickHouse/pull/56493) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix empty NAMED COLLECTIONs [#56494](https://github.com/ClickHouse/ClickHouse/pull/56494) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix two cases of projection analysis. [#56502](https://github.com/ClickHouse/ClickHouse/pull/56502) ([Amos Bird](https://github.com/amosbird)). 
+* Fix handling of aliases in query cache [#56545](https://github.com/ClickHouse/ClickHouse/pull/56545) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix conversion from `Nullable(Enum)` to `Nullable(String)` [#56644](https://github.com/ClickHouse/ClickHouse/pull/56644) ([Nikolay Degterinsky](https://github.com/evillique)). +* More reliable log handling in Keeper [#56670](https://github.com/ClickHouse/ClickHouse/pull/56670) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix configuration merge for nodes with substitution attributes [#56694](https://github.com/ClickHouse/ClickHouse/pull/56694) ([Konstantin Bogdanov](https://github.com/thevar1able)). +* Fix duplicate usage of table function input(). [#56695](https://github.com/ClickHouse/ClickHouse/pull/56695) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix: RabbitMQ OpenSSL dynamic loading issue [#56703](https://github.com/ClickHouse/ClickHouse/pull/56703) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix crash in GCD codec in case when zeros present in data [#56704](https://github.com/ClickHouse/ClickHouse/pull/56704) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix 'mutex lock failed: Invalid argument' in clickhouse-local during insert into function [#56710](https://github.com/ClickHouse/ClickHouse/pull/56710) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix Date text parsing in optimistic path [#56765](https://github.com/ClickHouse/ClickHouse/pull/56765) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix crash in FPC codec [#56795](https://github.com/ClickHouse/ClickHouse/pull/56795) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* DatabaseReplicated: fix DDL query timeout after recovering a replica [#56796](https://github.com/ClickHouse/ClickHouse/pull/56796) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix incorrect nullable columns reporting in MySQL binary protocol [#56799](https://github.com/ClickHouse/ClickHouse/pull/56799) ([Serge Klochkov](https://github.com/slvrtrn)). +* Support Iceberg metadata files for metastore tables [#56810](https://github.com/ClickHouse/ClickHouse/pull/56810) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix TSAN report under transform [#56817](https://github.com/ClickHouse/ClickHouse/pull/56817) ([Raúl Marín](https://github.com/Algunenano)). +* Fix SET query and SETTINGS formatting [#56825](https://github.com/ClickHouse/ClickHouse/pull/56825) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix failure to start due to table dependency in joinGet [#56828](https://github.com/ClickHouse/ClickHouse/pull/56828) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix flattening existing Nested columns during ADD COLUMN [#56830](https://github.com/ClickHouse/ClickHouse/pull/56830) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix allow cr end of line for csv [#56901](https://github.com/ClickHouse/ClickHouse/pull/56901) ([KevinyhZou](https://github.com/KevinyhZou)). +* Fix `tryBase64Decode` with invalid input [#56913](https://github.com/ClickHouse/ClickHouse/pull/56913) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix generating deep nested columns in CapnProto/Protobuf schemas [#56941](https://github.com/ClickHouse/ClickHouse/pull/56941) ([Kruglov Pavel](https://github.com/Avogar)). +* Prevent incompatible ALTER of projection columns [#56948](https://github.com/ClickHouse/ClickHouse/pull/56948) ([Amos Bird](https://github.com/amosbird)). 
+* Fix sqlite file path validation [#56984](https://github.com/ClickHouse/ClickHouse/pull/56984) ([San](https://github.com/santrancisco)). +* S3Queue: fix metadata reference increment [#56990](https://github.com/ClickHouse/ClickHouse/pull/56990) ([Kseniia Sumarokova](https://github.com/kssenii)). +* S3Queue minor fix [#56999](https://github.com/ClickHouse/ClickHouse/pull/56999) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix file path validation for DatabaseFileSystem [#57029](https://github.com/ClickHouse/ClickHouse/pull/57029) ([San](https://github.com/santrancisco)). +* Fix `fuzzBits` with `ARRAY JOIN` [#57033](https://github.com/ClickHouse/ClickHouse/pull/57033) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix Nullptr dereference in partial merge join with joined_subquery_re… [#57048](https://github.com/ClickHouse/ClickHouse/pull/57048) ([vdimir](https://github.com/vdimir)). +* Fix race condition in RemoteSource [#57052](https://github.com/ClickHouse/ClickHouse/pull/57052) ([Raúl Marín](https://github.com/Algunenano)). +* Implement `bitHammingDistance` for big integers [#57073](https://github.com/ClickHouse/ClickHouse/pull/57073) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* S3-style links bug fix [#57075](https://github.com/ClickHouse/ClickHouse/pull/57075) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Fix JSON_QUERY function with multiple numeric paths [#57096](https://github.com/ClickHouse/ClickHouse/pull/57096) ([KevinyhZou](https://github.com/KevinyhZou)). +* Fix buffer overflow in Gorilla codec [#57107](https://github.com/ClickHouse/ClickHouse/pull/57107) ([Nikolay Degterinsky](https://github.com/evillique)). +* Close interserver connection on any exception before authentication [#57142](https://github.com/ClickHouse/ClickHouse/pull/57142) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix segfault after ALTER UPDATE with Nullable MATERIALIZED column [#57147](https://github.com/ClickHouse/ClickHouse/pull/57147) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix incorrect JOIN plan optimization with partially materialized normal projection [#57196](https://github.com/ClickHouse/ClickHouse/pull/57196) ([Amos Bird](https://github.com/amosbird)). +* Ignore comments when comparing column descriptions [#57259](https://github.com/ClickHouse/ClickHouse/pull/57259) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix `ReadonlyReplica` metric for all cases [#57267](https://github.com/ClickHouse/ClickHouse/pull/57267) ([Antonio Andelic](https://github.com/antonio2368)). +* Background merges correctly use temporary data storage in the cache [#57275](https://github.com/ClickHouse/ClickHouse/pull/57275) ([vdimir](https://github.com/vdimir)). +* Keeper fix for changelog and snapshots [#57299](https://github.com/ClickHouse/ClickHouse/pull/57299) ([Antonio Andelic](https://github.com/antonio2368)). +* Ignore finished ON CLUSTER tasks if hostname changed [#57339](https://github.com/ClickHouse/ClickHouse/pull/57339) ([Alexander Tokmakov](https://github.com/tavplubix)). +* MergeTree mutations reuse source part index granularity [#57352](https://github.com/ClickHouse/ClickHouse/pull/57352) ([Maksim Kita](https://github.com/kitaisreal)). +* FS cache: add a limit for background download [#57424](https://github.com/ClickHouse/ClickHouse/pull/57424) ([Kseniia Sumarokova](https://github.com/kssenii)). 
+ + ### ClickHouse release 23.10, 2023-11-02 #### Backward Incompatible Change * There is no longer an option to automatically remove broken data parts. This closes [#55174](https://github.com/ClickHouse/ClickHouse/issues/55174). [#55184](https://github.com/ClickHouse/ClickHouse/pull/55184) ([Alexey Milovidov](https://github.com/alexey-milovidov)). [#55557](https://github.com/ClickHouse/ClickHouse/pull/55557) ([Jihyuk Bok](https://github.com/tomahawk28)). @@ -39,7 +391,7 @@ * Allow to drop cache for Protobuf format with `SYSTEM DROP SCHEMA FORMAT CACHE [FOR Protobuf]`. [#55064](https://github.com/ClickHouse/ClickHouse/pull/55064) ([Aleksandr Musorin](https://github.com/AVMusorin)). * Add external HTTP Basic authenticator. [#55199](https://github.com/ClickHouse/ClickHouse/pull/55199) ([Aleksei Filatov](https://github.com/aalexfvk)). * Added function `byteSwap` which reverses the bytes of unsigned integers. This is particularly useful for reversing values of types which are represented as unsigned integers internally such as IPv4. [#55211](https://github.com/ClickHouse/ClickHouse/pull/55211) ([Priyansh Agrawal](https://github.com/Priyansh121096)). -* Added function `formatQuery()` which returns a formatted version (possibly spanning multiple lines) of a SQL query string. Also added function `formatQuerySingleLine()` which does the same but the returned string will not contain linebreaks. [#55239](https://github.com/ClickHouse/ClickHouse/pull/55239) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Added function `formatQuery` which returns a formatted version (possibly spanning multiple lines) of a SQL query string. Also added function `formatQuerySingleLine` which does the same but the returned string will not contain linebreaks. [#55239](https://github.com/ClickHouse/ClickHouse/pull/55239) ([Salvatore Mesoraca](https://github.com/aiven-sal)). * Added `DWARF` input format that reads debug symbols from an ELF executable/library/object file. [#55450](https://github.com/ClickHouse/ClickHouse/pull/55450) ([Michael Kolupaev](https://github.com/al13n321)). * Allow to save unparsed records and errors in RabbitMQ, NATS and FileLog engines. Add virtual columns `_error` and `_raw_message` (for NATS and RabbitMQ), `_raw_record` (for FileLog) that are filled when ClickHouse fails to parse a new record. The behaviour is controlled by the storage settings `nats_handle_error_mode` for NATS, `rabbitmq_handle_error_mode` for RabbitMQ, and `handle_error_mode` for FileLog, similar to `kafka_handle_error_mode`. If it's set to `default`, an exception will be thrown when ClickHouse fails to parse a record; if it's set to `stream`, the error and raw record will be saved into virtual columns. Closes [#36035](https://github.com/ClickHouse/ClickHouse/issues/36035). [#55477](https://github.com/ClickHouse/ClickHouse/pull/55477) ([Kruglov Pavel](https://github.com/Avogar)). * Keeper client improvement: add the `get_all_children_number` command that returns the number of all children nodes under a specific path. [#55485](https://github.com/ClickHouse/ClickHouse/pull/55485) ([guoxiaolong](https://github.com/guoxiaolongzte)). @@ -74,11 +426,11 @@ * Reduced memory consumption during loading of hierarchical dictionaries. [#55838](https://github.com/ClickHouse/ClickHouse/pull/55838) ([Nikita Taranov](https://github.com/nickitat)). * All dictionaries support setting `dictionary_use_async_executor`. [#55839](https://github.com/ClickHouse/ClickHouse/pull/55839) ([vdimir](https://github.com/vdimir)).
* Prevent excessive memory usage when deserializing AggregateFunctionTopKGenericData. [#55947](https://github.com/ClickHouse/ClickHouse/pull/55947) ([Raúl Marín](https://github.com/Algunenano)). -* On a Keeper with lots of watches AsyncMetrics threads can consume 100% of CPU for noticeable time in `DB::KeeperStorage::getSessionsWithWatchesCount()`. The fix is to avoid traversing heavy `watches` and `list_watches` sets. [#56054](https://github.com/ClickHouse/ClickHouse/pull/56054) ([Alexander Gololobov](https://github.com/davenger)). -* Add setting `optimize_trivial_approximate_count_query` to use `count()` approximation for storage EmbeddedRocksDB. Enable trivial count for StorageJoin. [#55806](https://github.com/ClickHouse/ClickHouse/pull/55806) ([Duc Canh Le](https://github.com/canhld94)). +* On a Keeper with lots of watches AsyncMetrics threads can consume 100% of CPU for noticeable time in `DB::KeeperStorage::getSessionsWithWatchesCount`. The fix is to avoid traversing heavy `watches` and `list_watches` sets. [#56054](https://github.com/ClickHouse/ClickHouse/pull/56054) ([Alexander Gololobov](https://github.com/davenger)). +* Add setting `optimize_trivial_approximate_count_query` to use `count` approximation for storage EmbeddedRocksDB. Enable trivial count for StorageJoin. [#55806](https://github.com/ClickHouse/ClickHouse/pull/55806) ([Duc Canh Le](https://github.com/canhld94)). #### Improvement -* Functions `toDayOfWeek()` (MySQL alias: `DAYOFWEEK()`), `toYearWeek()` (`YEARWEEK()`) and `toWeek()` (`WEEK()`) now support `String` arguments. This makes their behavior consistent with MySQL's behavior. [#55589](https://github.com/ClickHouse/ClickHouse/pull/55589) ([Robert Schulze](https://github.com/rschu1ze)). +* Functions `toDayOfWeek` (MySQL alias: `DAYOFWEEK`), `toYearWeek` (`YEARWEEK`) and `toWeek` (`WEEK`) now support `String` arguments. This makes their behavior consistent with MySQL's behavior. [#55589](https://github.com/ClickHouse/ClickHouse/pull/55589) ([Robert Schulze](https://github.com/rschu1ze)). * Introduced setting `date_time_overflow_behavior` with possible values `ignore`, `throw`, `saturate` that controls the overflow behavior when converting from Date, Date32, DateTime64, Integer or Float to Date, Date32, DateTime or DateTime64. [#55696](https://github.com/ClickHouse/ClickHouse/pull/55696) ([Andrey Zvonov](https://github.com/zvonand)). * Implement query parameters support for `ALTER TABLE ... ACTION PARTITION [ID] {parameter_name:ParameterType}`. Merges [#49516](https://github.com/ClickHouse/ClickHouse/issues/49516). Closes [#49449](https://github.com/ClickHouse/ClickHouse/issues/49449). [#55604](https://github.com/ClickHouse/ClickHouse/pull/55604) ([alesapin](https://github.com/alesapin)). * Print processor ids in a prettier manner in EXPLAIN. [#48852](https://github.com/ClickHouse/ClickHouse/pull/48852) ([Vlad Seliverstov](https://github.com/behebot)). @@ -112,7 +464,7 @@ * Functions `(add|subtract)(Year|Quarter|Month|Week|Day|Hour|Minute|Second|Millisecond|Microsecond|Nanosecond)` now support string-encoded date arguments, e.g. `SELECT addDays('2023-10-22', 1)`. This increases compatibility with MySQL and is needed by Tableau Online. [#55869](https://github.com/ClickHouse/ClickHouse/pull/55869) ([Robert Schulze](https://github.com/rschu1ze)). * The setting `apply_deleted_mask`, when disabled, allows reading rows that were marked as deleted by lightweight DELETE queries. This is useful for debugging.
[#55952](https://github.com/ClickHouse/ClickHouse/pull/55952) ([Alexander Gololobov](https://github.com/davenger)). * Allow skipping `null` values when serializing Tuple to JSON objects, which makes it possible to keep compatibility with Spark's `to_json` function and is also useful for Gluten. [#55956](https://github.com/ClickHouse/ClickHouse/pull/55956) ([李扬](https://github.com/taiyang-li)). -* Functions `(add|sub)Date()` now support string-encoded date arguments, e.g. `SELECT addDate('2023-10-22 11:12:13', INTERVAL 5 MINUTE)`. The same support for string-encoded date arguments is added to the plus and minus operators, e.g. `SELECT '2023-10-23' + INTERVAL 1 DAY`. This increases compatibility with MySQL and is needed by Tableau Online. [#55960](https://github.com/ClickHouse/ClickHouse/pull/55960) ([Robert Schulze](https://github.com/rschu1ze)). +* Functions `(add|sub)Date` now support string-encoded date arguments, e.g. `SELECT addDate('2023-10-22 11:12:13', INTERVAL 5 MINUTE)`. The same support for string-encoded date arguments is added to the plus and minus operators, e.g. `SELECT '2023-10-23' + INTERVAL 1 DAY`. This increases compatibility with MySQL and is needed by Tableau Online. [#55960](https://github.com/ClickHouse/ClickHouse/pull/55960) ([Robert Schulze](https://github.com/rschu1ze)). * Allow unquoted strings with CR (`\r`) in CSV format. Closes [#39930](https://github.com/ClickHouse/ClickHouse/issues/39930). [#56046](https://github.com/ClickHouse/ClickHouse/pull/56046) ([Kruglov Pavel](https://github.com/Avogar)). * Allow to run `clickhouse-keeper` using embedded config. [#56086](https://github.com/ClickHouse/ClickHouse/pull/56086) ([Maksim Kita](https://github.com/kitaisreal)). * Set a limit on the maximum configuration value for `queued.min.messages` to avoid a problem with starting to fetch data from Kafka. [#56121](https://github.com/ClickHouse/ClickHouse/pull/56121) ([Stas Morozov](https://github.com/r3b-fish)). @@ -133,7 +485,7 @@ * Fixed a bug where the `match` function (regex) with a pattern containing alternation produced an incorrect key condition. Closes #53222. [#54696](https://github.com/ClickHouse/ClickHouse/pull/54696) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). * Fix 'Cannot find column' in read-in-order optimization with ARRAY JOIN [#51746](https://github.com/ClickHouse/ClickHouse/pull/51746) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). * Support missed experimental `Object(Nullable(json))` subcolumns in query. [#54052](https://github.com/ClickHouse/ClickHouse/pull/54052) ([zps](https://github.com/VanDarkholme7)). -* Re-add fix for `accurateCastOrNull()` [#54629](https://github.com/ClickHouse/ClickHouse/pull/54629) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Re-add fix for `accurateCastOrNull` [#54629](https://github.com/ClickHouse/ClickHouse/pull/54629) ([Salvatore Mesoraca](https://github.com/aiven-sal)). * Fix detecting `DEFAULT` for columns of a Distributed table created without AS [#55060](https://github.com/ClickHouse/ClickHouse/pull/55060) ([Vitaly Baranov](https://github.com/vitlibar)). * Proper cleanup in case of exception in ctor of ShellCommandSource [#55103](https://github.com/ClickHouse/ClickHouse/pull/55103) ([Alexander Gololobov](https://github.com/davenger)). * Fix deadlock in LDAP assigned role update [#55119](https://github.com/ClickHouse/ClickHouse/pull/55119) ([Julian Maicher](https://github.com/jmaicher)).
@@ -191,7 +543,7 @@ * Add error handler to odbc-bridge [#56185](https://github.com/ClickHouse/ClickHouse/pull/56185) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). -### ClickHouse release 23.9, 2023-09-28 +### ClickHouse release 23.9, 2023-09-28 #### Backward Incompatible Change * Remove the `status_info` configuration option and dictionaries status from the default Prometheus handler. [#54090](https://github.com/ClickHouse/ClickHouse/pull/54090) ([Alexey Milovidov](https://github.com/alexey-milovidov)). @@ -213,7 +565,7 @@ * Add function `decodeHTMLComponent`. [#54097](https://github.com/ClickHouse/ClickHouse/pull/54097) ([Bharat Nallan](https://github.com/bharatnc)). * Added `peak_threads_usage` to query_log table. [#54335](https://github.com/ClickHouse/ClickHouse/pull/54335) ([Alexey Gerasimchuck](https://github.com/Demilivor)). * Add `SHOW FUNCTIONS` support to clickhouse-client. [#54337](https://github.com/ClickHouse/ClickHouse/pull/54337) ([Julia Kartseva](https://github.com/wat-ze-hex)). -* Added function `toDaysSinceYearZero` with alias `TO_DAYS` (for compatibility with MySQL) which returns the number of days passed since `0001-01-01` (in Proleptic Gregorian Calendar). [#54479](https://github.com/ClickHouse/ClickHouse/pull/54479) ([Robert Schulze](https://github.com/rschu1ze)). Function `toDaysSinceYearZero()` now supports arguments of type `DateTime` and `DateTime64`. [#54856](https://github.com/ClickHouse/ClickHouse/pull/54856) ([Serge Klochkov](https://github.com/slvrtrn)). +* Added function `toDaysSinceYearZero` with alias `TO_DAYS` (for compatibility with MySQL) which returns the number of days passed since `0001-01-01` (in Proleptic Gregorian Calendar). [#54479](https://github.com/ClickHouse/ClickHouse/pull/54479) ([Robert Schulze](https://github.com/rschu1ze)). Function `toDaysSinceYearZero` now supports arguments of type `DateTime` and `DateTime64`. [#54856](https://github.com/ClickHouse/ClickHouse/pull/54856) ([Serge Klochkov](https://github.com/slvrtrn)). * Added functions `YYYYMMDDtoDate`, `YYYYMMDDtoDate32`, `YYYYMMDDhhmmssToDateTime` and `YYYYMMDDhhmmssToDateTime64`. They convert a date or date with time encoded as integer (e.g. 20230911) into a native date or date with time. As such, they provide the opposite functionality of existing functions `YYYYMMDDToDate`, `YYYYMMDDToDateTime`, `YYYYMMDDhhmmddToDateTime`, `YYYYMMDDhhmmddToDateTime64`. [#54509](https://github.com/ClickHouse/ClickHouse/pull/54509) ([Quanfa Fu](https://github.com/dentiscalprum)) ([Robert Schulze](https://github.com/rschu1ze)). * Add several string distance functions, including `byteHammingDistance`, `editDistance`. [#54935](https://github.com/ClickHouse/ClickHouse/pull/54935) ([flynn](https://github.com/ucasfl)). * Allow specifying the expiration date and, optionally, the time for user credentials with `VALID UNTIL datetime` clause. [#51261](https://github.com/ClickHouse/ClickHouse/pull/51261) ([Nikolay Degterinsky](https://github.com/evillique)). @@ -229,7 +581,7 @@ * An optimization to rewrite `COUNT(DISTINCT ...)` and various `uniq` variants to `count` if it is selected from a subquery with GROUP BY. [#52082](https://github.com/ClickHouse/ClickHouse/pull/52082) [#52645](https://github.com/ClickHouse/ClickHouse/pull/52645) ([JackyWoo](https://github.com/JackyWoo)). * Remove manual calls to `mmap/mremap/munmap` and delegate all this work to `jemalloc` - and it slightly improves performance. 
[#52792](https://github.com/ClickHouse/ClickHouse/pull/52792) ([Nikita Taranov](https://github.com/nickitat)). * Fixed high CPU consumption when working with NATS. [#54399](https://github.com/ClickHouse/ClickHouse/pull/54399) ([Vasilev Pyotr](https://github.com/vahpetr)). -* Since we use separate instructions for executing `toString()` with a datetime argument, it is possible to improve performance a bit for non-datetime arguments and have some parts of the code cleaner. Follows up [#53680](https://github.com/ClickHouse/ClickHouse/issues/53680). [#54443](https://github.com/ClickHouse/ClickHouse/pull/54443) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Since we use separate instructions for executing `toString` with a datetime argument, it is possible to improve performance a bit for non-datetime arguments and have some parts of the code cleaner. Follows up [#53680](https://github.com/ClickHouse/ClickHouse/issues/53680). [#54443](https://github.com/ClickHouse/ClickHouse/pull/54443) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). * Instead of serializing JSON elements into a `std::stringstream`, this PR tries to put the serialization result into `ColumnString` directly. [#54613](https://github.com/ClickHouse/ClickHouse/pull/54613) ([lgbo](https://github.com/lgbo-ustc)). * Enable ORDER BY optimization for reading data in corresponding order from a MergeTree table in case the table is behind a view. [#54628](https://github.com/ClickHouse/ClickHouse/pull/54628) ([Vitaly Baranov](https://github.com/vitlibar)). * Improve JSON SQL functions by reusing `GeneratorJSONPath` and removing several shared pointers. [#54735](https://github.com/ClickHouse/ClickHouse/pull/54735) ([lgbo](https://github.com/lgbo-ustc)). @@ -479,7 +831,7 @@ * The `domainRFC` function now supports IPv6 in square brackets. [#53506](https://github.com/ClickHouse/ClickHouse/pull/53506) ([Chen768959](https://github.com/Chen768959)). * Use longer timeout for S3 CopyObject requests, which are used in backups. [#53533](https://github.com/ClickHouse/ClickHouse/pull/53533) ([Michael Kolupaev](https://github.com/al13n321)). * Added server setting `aggregate_function_group_array_max_element_size`. This setting is used to limit array size for `groupArray` function at serialization. The default value is `16777215`. [#53550](https://github.com/ClickHouse/ClickHouse/pull/53550) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). -* `SCHEMA()` was added as an alias for `DATABASE()` to improve MySQL compatibility. [#53587](https://github.com/ClickHouse/ClickHouse/pull/53587) ([Daniël van Eeden](https://github.com/dveeden)). +* `SCHEMA` was added as an alias for `DATABASE` to improve MySQL compatibility. [#53587](https://github.com/ClickHouse/ClickHouse/pull/53587) ([Daniël van Eeden](https://github.com/dveeden)). * Add asynchronous metrics about tables in the system database. For example, `TotalBytesOfMergeTreeTablesSystem`. This closes [#53603](https://github.com/ClickHouse/ClickHouse/issues/53603). [#53604](https://github.com/ClickHouse/ClickHouse/pull/53604) ([Alexey Milovidov](https://github.com/alexey-milovidov)). * SQL editor in the Play UI and Dashboard will not use Grammarly. [#53614](https://github.com/ClickHouse/ClickHouse/pull/53614) ([Alexey Milovidov](https://github.com/alexey-milovidov)). * As expert-level settings, it is now possible to (1) configure the size_ratio (i.e.
the relative size of the protected queue) of the [index] mark/uncompressed caches, (2) configure the cache policy of the index mark and index uncompressed caches. [#53657](https://github.com/ClickHouse/ClickHouse/pull/53657) ([Robert Schulze](https://github.com/rschu1ze)). @@ -741,7 +1093,7 @@ * Disable expression templates for time intervals [#52335](https://github.com/ClickHouse/ClickHouse/pull/52335) ([Alexander Tokmakov](https://github.com/tavplubix)). * Fix `apply_snapshot` in Keeper [#52358](https://github.com/ClickHouse/ClickHouse/pull/52358) ([Antonio Andelic](https://github.com/antonio2368)). * Update build-osx.md [#52377](https://github.com/ClickHouse/ClickHouse/pull/52377) ([AlexBykovski](https://github.com/AlexBykovski)). -* Fix `countSubstrings()` hang with empty needle and a column haystack [#52409](https://github.com/ClickHouse/ClickHouse/pull/52409) ([Sergei Trifonov](https://github.com/serxa)). +* Fix `countSubstrings` hang with empty needle and a column haystack [#52409](https://github.com/ClickHouse/ClickHouse/pull/52409) ([Sergei Trifonov](https://github.com/serxa)). * Fix normal projection with merge table [#52432](https://github.com/ClickHouse/ClickHouse/pull/52432) ([Amos Bird](https://github.com/amosbird)). * Fix possible double-free in Aggregator [#52439](https://github.com/ClickHouse/ClickHouse/pull/52439) ([Nikita Taranov](https://github.com/nickitat)). * Fixed inserting into Buffer engine [#52440](https://github.com/ClickHouse/ClickHouse/pull/52440) ([Vasily Nemkov](https://github.com/Enmk)). @@ -1585,7 +1937,7 @@ * A couple of segfaults have been reported around `c-ares`. They were introduced in my previous pull requests. I have fixed them with the help of Alexander Tokmakov. [#45629](https://github.com/ClickHouse/ClickHouse/pull/45629) ([Arthur Passos](https://github.com/arthurpassos)). * Fix key description when encountering duplicate primary keys. This can happen in projections. See [#45590](https://github.com/ClickHouse/ClickHouse/issues/45590) for details. [#45686](https://github.com/ClickHouse/ClickHouse/pull/45686) ([Amos Bird](https://github.com/amosbird)). * Set compression method and level for backup. Closes [#45690](https://github.com/ClickHouse/ClickHouse/issues/45690). [#45737](https://github.com/ClickHouse/ClickHouse/pull/45737) ([Pradeep Chhetri](https://github.com/chhetripradeep)). -* Should use `select_query_typed.limitByOffset()` instead of `select_query_typed.limitOffset()`. [#45817](https://github.com/ClickHouse/ClickHouse/pull/45817) ([刘陶峰](https://github.com/taofengliu)). +* Should use `select_query_typed.limitByOffset` instead of `select_query_typed.limitOffset`. [#45817](https://github.com/ClickHouse/ClickHouse/pull/45817) ([刘陶峰](https://github.com/taofengliu)). * When using the experimental analyzer, queries like `SELECT number FROM numbers(100) LIMIT 10 OFFSET 10;` get wrong results (an empty result for this SQL). That is caused by an unnecessary offset step added by the planner. [#45822](https://github.com/ClickHouse/ClickHouse/pull/45822) ([刘陶峰](https://github.com/taofengliu)). * Backward compatibility - allow implicit narrowing conversion from UInt64 to IPv4 - required for "INSERT ... VALUES ..." expression. [#45865](https://github.com/ClickHouse/ClickHouse/pull/45865) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). * Bugfix: IPv6 parser for a mixed IPv4 address with a missing first octet (like `::.1.2.3`). [#45871](https://github.com/ClickHouse/ClickHouse/pull/45871) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
diff --git a/LICENSE b/LICENSE index 65c5df824c6..c653e59a8f3 100644 --- a/LICENSE +++ b/LICENSE @@ -1,4 +1,4 @@ -Copyright 2016-2023 ClickHouse, Inc. +Copyright 2016-2024 ClickHouse, Inc. Apache License Version 2.0, January 2004 @@ -188,7 +188,7 @@ Copyright 2016-2023 ClickHouse, Inc. same "printed page" as the copyright notice for easier identification within third-party archives. - Copyright 2016-2023 ClickHouse, Inc. + Copyright 2016-2024 ClickHouse, Inc. Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. diff --git a/README.md b/README.md index bf8ef0b4e98..c56b3c2fd0d 100644 --- a/README.md +++ b/README.md @@ -33,12 +33,7 @@ curl https://clickhouse.com/ | sh ## Upcoming Events -* [**ClickHouse Meetup in Berlin**](https://www.meetup.com/clickhouse-berlin-user-group/events/296488501/) - Nov 30 -* [**ClickHouse Meetup in NYC**](https://www.meetup.com/clickhouse-new-york-user-group/events/296488779/) - Dec 11 -* [**ClickHouse Meetup in Sydney**](https://www.meetup.com/clickhouse-sydney-user-group/events/297638812/) - Dec 12 -* [**ClickHouse Meetup in Boston**](https://www.meetup.com/clickhouse-boston-user-group/events/296488840/) - Dec 12 - -Also, keep an eye out for upcoming meetups around the world. Somewhere else you want us to be? Please feel free to reach out to tyler clickhouse com. +Keep an eye out for upcoming meetups around the world. Somewhere else you want us to be? Please feel free to reach out to tyler clickhouse com. ## Recent Recordings * **Recent Meetup Videos**: [Meetup Playlist](https://www.youtube.com/playlist?list=PL0Z2YDlm0b3iNDUzpY1S3L_iV4nARda_U) Whenever possible recordings of the ClickHouse Community Meetups are edited and presented as individual talks. Current featuring "Modern SQL in 2023", "Fast, Concurrent, and Consistent Asynchronous INSERTS in ClickHouse", and "Full-Text Indices: Design and Experiments" diff --git a/SECURITY.md b/SECURITY.md index 5477628cee4..a200e172a3b 100644 --- a/SECURITY.md +++ b/SECURITY.md @@ -13,8 +13,10 @@ The following versions of ClickHouse server are currently being supported with s | Version | Supported | |:-|:-| +| 23.12 | ✔️ | +| 23.11 | ✔️ | | 23.10 | ✔️ | -| 23.9 | ✔️ | +| 23.9 | ❌ | | 23.8 | ✔️ | | 23.7 | ❌ | | 23.6 | ❌ | diff --git a/base/glibc-compatibility/glibc-compatibility.c b/base/glibc-compatibility/glibc-compatibility.c index 49bb81a58be..738cda47877 100644 --- a/base/glibc-compatibility/glibc-compatibility.c +++ b/base/glibc-compatibility/glibc-compatibility.c @@ -30,7 +30,6 @@ int __gai_sigqueue(int sig, const union sigval val, pid_t caller_pid) } -#include #include #include diff --git a/base/poco/Foundation/CMakeLists.txt b/base/poco/Foundation/CMakeLists.txt index d0dde8a51a5..dfb41a33fb1 100644 --- a/base/poco/Foundation/CMakeLists.txt +++ b/base/poco/Foundation/CMakeLists.txt @@ -55,7 +55,6 @@ set (SRCS src/DigestStream.cpp src/DirectoryIterator.cpp src/DirectoryIteratorStrategy.cpp - src/DirectoryWatcher.cpp src/Environment.cpp src/Error.cpp src/ErrorHandler.cpp diff --git a/base/poco/Foundation/include/Poco/DirectoryWatcher.h b/base/poco/Foundation/include/Poco/DirectoryWatcher.h deleted file mode 100644 index 00964a5512a..00000000000 --- a/base/poco/Foundation/include/Poco/DirectoryWatcher.h +++ /dev/null @@ -1,228 +0,0 @@ -// -// DirectoryWatcher.h -// -// Library: Foundation -// Package: Filesystem -// Module: DirectoryWatcher -// -// Definition of the DirectoryWatcher class. 
-// -// Copyright (c) 2012, Applied Informatics Software Engineering GmbH. -// and Contributors. -// -// SPDX-License-Identifier: BSL-1.0 -// - - -#ifndef Foundation_DirectoryWatcher_INCLUDED -#define Foundation_DirectoryWatcher_INCLUDED - - -#include "Poco/Foundation.h" - - -#ifndef POCO_NO_INOTIFY - - -# include "Poco/AtomicCounter.h" -# include "Poco/BasicEvent.h" -# include "Poco/File.h" -# include "Poco/Runnable.h" -# include "Poco/Thread.h" - - -namespace Poco -{ - - -class DirectoryWatcherStrategy; - - -class Foundation_API DirectoryWatcher : protected Runnable -/// This class is used to get notifications about changes -/// to the filesystem, more specifically, to a specific -/// directory. Changes to a directory are reported via -/// events. -/// -/// A thread will be created that watches the specified -/// directory for changes. Events are reported in the context -/// of this thread. -/// -/// Note that changes to files in subdirectories of the watched -/// directory are not reported. Separate DirectoryWatcher objects -/// must be created for these directories if they should be watched. -/// -/// Changes to file attributes are not reported. -/// -/// On Windows, this class is implemented using FindFirstChangeNotification()/FindNextChangeNotification(). -/// On Linux, this class is implemented using inotify. -/// On FreeBSD and Darwin (Mac OS X, iOS), this class uses kevent/kqueue. -/// On all other platforms, the watched directory is periodically scanned -/// for changes. This can negatively affect performance if done too often. -/// Therefore, the interval in which scans are done can be specified in -/// the constructor. Note that periodic scanning will also be done on FreeBSD -/// and Darwin if events for changes to files (DW_ITEM_MODIFIED) are enabled. -/// -/// DW_ITEM_MOVED_FROM and DW_ITEM_MOVED_TO events will only be reported -/// on Linux. On other platforms, a file rename or move operation -/// will be reported via a DW_ITEM_REMOVED and a DW_ITEM_ADDED event. -/// The order of these two events is not defined. -/// -/// An event mask can be specified to enable only certain events. -{ -public: - enum DirectoryEventType - { - DW_ITEM_ADDED = 1, - /// A new item has been created and added to the directory. - - DW_ITEM_REMOVED = 2, - /// An item has been removed from the directory. - - DW_ITEM_MODIFIED = 4, - /// An item has been modified. - - DW_ITEM_MOVED_FROM = 8, - /// An item has been renamed or moved. This event delivers the old name. - - DW_ITEM_MOVED_TO = 16 - /// An item has been renamed or moved. This event delivers the new name. - }; - - enum DirectoryEventMask - { - DW_FILTER_ENABLE_ALL = 31, - /// Enables all event types. - - DW_FILTER_DISABLE_ALL = 0 - /// Disables all event types. - }; - - enum - { - DW_DEFAULT_SCAN_INTERVAL = 5 /// Default scan interval for platforms that don't provide a native notification mechanism. - }; - - struct DirectoryEvent - { - DirectoryEvent(const File & f, DirectoryEventType ev) : item(f), event(ev) { } - - const File & item; /// The directory or file that has been changed. - DirectoryEventType event; /// The kind of event. - }; - - BasicEvent itemAdded; - /// Fired when a file or directory has been created or added to the directory. - - BasicEvent itemRemoved; - /// Fired when a file or directory has been removed from the directory. - - BasicEvent itemModified; - /// Fired when a file or directory has been modified. - - BasicEvent itemMovedFrom; - /// Fired when a file or directory has been renamed. 
This event delivers the old name. - - BasicEvent itemMovedTo; - /// Fired when a file or directory has been moved. This event delivers the new name. - - BasicEvent scanError; - /// Fired when an error occurs while scanning for changes. - - DirectoryWatcher(const std::string & path, int eventMask = DW_FILTER_ENABLE_ALL, int scanInterval = DW_DEFAULT_SCAN_INTERVAL); - /// Creates a DirectoryWatcher for the directory given in path. - /// To enable only specific events, an eventMask can be specified by - /// OR-ing the desired event IDs (e.g., DW_ITEM_ADDED | DW_ITEM_MODIFIED). - /// On platforms where no native filesystem notifications are available, - /// scanInterval specifies the interval in seconds between scans - /// of the directory. - - DirectoryWatcher(const File & directory, int eventMask = DW_FILTER_ENABLE_ALL, int scanInterval = DW_DEFAULT_SCAN_INTERVAL); - /// Creates a DirectoryWatcher for the specified directory - /// To enable only specific events, an eventMask can be specified by - /// OR-ing the desired event IDs (e.g., DW_ITEM_ADDED | DW_ITEM_MODIFIED). - /// On platforms where no native filesystem notifications are available, - /// scanInterval specifies the interval in seconds between scans - /// of the directory. - - ~DirectoryWatcher(); - /// Destroys the DirectoryWatcher. - - void suspendEvents(); - /// Suspends sending of events. Can be called multiple times, but every - /// call to suspendEvent() must be matched by a call to resumeEvents(). - - void resumeEvents(); - /// Resumes events, after they have been suspended with a call to suspendEvents(). - - bool eventsSuspended() const; - /// Returns true iff events are suspended. - - int eventMask() const; - /// Returns the value of the eventMask passed to the constructor. - - int scanInterval() const; - /// Returns the scan interval in seconds. - - const File & directory() const; - /// Returns the directory being watched. - - bool supportsMoveEvents() const; - /// Returns true iff the platform supports DW_ITEM_MOVED_FROM/itemMovedFrom and - /// DW_ITEM_MOVED_TO/itemMovedTo events. - -protected: - void init(); - void stop(); - void run(); - -private: - DirectoryWatcher(); - DirectoryWatcher(const DirectoryWatcher &); - DirectoryWatcher & operator=(const DirectoryWatcher &); - - Thread _thread; - File _directory; - int _eventMask; - AtomicCounter _eventsSuspended; - int _scanInterval; - DirectoryWatcherStrategy * _pStrategy; -}; - - -// -// inlines -// - - -inline bool DirectoryWatcher::eventsSuspended() const -{ - return _eventsSuspended.value() > 0; -} - - -inline int DirectoryWatcher::eventMask() const -{ - return _eventMask; -} - - -inline int DirectoryWatcher::scanInterval() const -{ - return _scanInterval; -} - - -inline const File & DirectoryWatcher::directory() const -{ - return _directory; -} - - -} // namespace Poco - - -#endif // POCO_NO_INOTIFY - - -#endif // Foundation_DirectoryWatcher_INCLUDED diff --git a/base/poco/Foundation/include/Poco/StreamUtil.h b/base/poco/Foundation/include/Poco/StreamUtil.h index fa1814a0f2e..ed0a4fb5154 100644 --- a/base/poco/Foundation/include/Poco/StreamUtil.h +++ b/base/poco/Foundation/include/Poco/StreamUtil.h @@ -69,6 +69,9 @@ // init() is called in the MyIOS constructor. // Therefore we replace each call to init() with // the poco_ios_init macro defined below. +// +// Also this macro will adjust exceptions() flags, since by default std::ios +// will hide exceptions, while in ClickHouse it is better to pass them through. 
#if !defined(POCO_IOS_INIT_HACK) @@ -79,7 +82,10 @@ #if defined(POCO_IOS_INIT_HACK) # define poco_ios_init(buf) #else -# define poco_ios_init(buf) init(buf) +# define poco_ios_init(buf) do { \ + init(buf); \ + this->exceptions(std::ios::failbit | std::ios::badbit); \ +} while (0) #endif diff --git a/base/poco/Foundation/include/Poco/UTF32Encoding.h b/base/poco/Foundation/include/Poco/UTF32Encoding.h index e6784e787cc..dafac005e83 100644 --- a/base/poco/Foundation/include/Poco/UTF32Encoding.h +++ b/base/poco/Foundation/include/Poco/UTF32Encoding.h @@ -70,6 +70,15 @@ public: int queryConvert(const unsigned char * bytes, int length) const; int sequenceLength(const unsigned char * bytes, int length) const; +protected: + static int safeToInt(Poco::UInt32 value) + { + if (value <= 0x10FFFF) + return static_cast(value); + else + return -1; + } + private: bool _flipBytes; static const char * _names[]; diff --git a/base/poco/Foundation/src/DirectoryWatcher.cpp b/base/poco/Foundation/src/DirectoryWatcher.cpp deleted file mode 100644 index b559da65e09..00000000000 --- a/base/poco/Foundation/src/DirectoryWatcher.cpp +++ /dev/null @@ -1,602 +0,0 @@ -// -// DirectoryWatcher.cpp -// -// Library: Foundation -// Package: Filesystem -// Module: DirectoryWatcher -// -// Copyright (c) 2012, Applied Informatics Software Engineering GmbH. -// and Contributors. -// -// SPDX-License-Identifier: BSL-1.0 -// - - -#include "Poco/DirectoryWatcher.h" - - -#ifndef POCO_NO_INOTIFY - - -#include "Poco/Path.h" -#include "Poco/Glob.h" -#include "Poco/DirectoryIterator.h" -#include "Poco/Event.h" -#include "Poco/Exception.h" -#include "Poco/Buffer.h" -#if POCO_OS == POCO_OS_LINUX || POCO_OS == POCO_OS_ANDROID - #include - #include - #include -#elif POCO_OS == POCO_OS_MAC_OS_X || POCO_OS == POCO_OS_FREE_BSD - #include - #include - #include - #include - #include - #if (POCO_OS == POCO_OS_FREE_BSD) && !defined(O_EVTONLY) - #define O_EVTONLY 0x8000 - #endif -#endif -#include -#include -#include - -namespace Poco { - - -class DirectoryWatcherStrategy -{ -public: - DirectoryWatcherStrategy(DirectoryWatcher& owner): - _owner(owner) - { - } - - virtual ~DirectoryWatcherStrategy() - { - } - - DirectoryWatcher& owner() - { - return _owner; - } - - virtual void run() = 0; - virtual void stop() = 0; - virtual bool supportsMoveEvents() const = 0; - -protected: - struct ItemInfo - { - ItemInfo(): - size(0) - { - } - - ItemInfo(const ItemInfo& other): - path(other.path), - size(other.size), - lastModified(other.lastModified) - { - } - - explicit ItemInfo(const File& f): - path(f.path()), - size(f.isFile() ? 
f.getSize() : 0), - lastModified(f.getLastModified()) - { - } - - std::string path; - File::FileSize size; - Timestamp lastModified; - }; - typedef std::map ItemInfoMap; - - void scan(ItemInfoMap& entries) - { - DirectoryIterator it(owner().directory()); - DirectoryIterator end; - while (it != end) - { - entries[it.path().getFileName()] = ItemInfo(*it); - ++it; - } - } - - void compare(ItemInfoMap& oldEntries, ItemInfoMap& newEntries) - { - for (ItemInfoMap::iterator itn = newEntries.begin(); itn != newEntries.end(); ++itn) - { - ItemInfoMap::iterator ito = oldEntries.find(itn->first); - if (ito != oldEntries.end()) - { - if ((owner().eventMask() & DirectoryWatcher::DW_ITEM_MODIFIED) && !owner().eventsSuspended()) - { - if (itn->second.size != ito->second.size || itn->second.lastModified != ito->second.lastModified) - { - Poco::File f(itn->second.path); - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_MODIFIED); - owner().itemModified(&owner(), ev); - } - } - oldEntries.erase(ito); - } - else if ((owner().eventMask() & DirectoryWatcher::DW_ITEM_ADDED) && !owner().eventsSuspended()) - { - Poco::File f(itn->second.path); - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_ADDED); - owner().itemAdded(&owner(), ev); - } - } - if ((owner().eventMask() & DirectoryWatcher::DW_ITEM_REMOVED) && !owner().eventsSuspended()) - { - for (ItemInfoMap::iterator it = oldEntries.begin(); it != oldEntries.end(); ++it) - { - Poco::File f(it->second.path); - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_REMOVED); - owner().itemRemoved(&owner(), ev); - } - } - } - -private: - DirectoryWatcherStrategy(); - DirectoryWatcherStrategy(const DirectoryWatcherStrategy&); - DirectoryWatcherStrategy& operator = (const DirectoryWatcherStrategy&); - - DirectoryWatcher& _owner; -}; - - -#if POCO_OS == POCO_OS_WINDOWS_NT - - -class WindowsDirectoryWatcherStrategy: public DirectoryWatcherStrategy -{ -public: - WindowsDirectoryWatcherStrategy(DirectoryWatcher& owner): - DirectoryWatcherStrategy(owner) - { - _hStopped = CreateEventW(NULL, FALSE, FALSE, NULL); - if (!_hStopped) - throw SystemException("cannot create event"); - } - - ~WindowsDirectoryWatcherStrategy() - { - CloseHandle(_hStopped); - } - - void run() - { - ItemInfoMap entries; - scan(entries); - - DWORD filter = FILE_NOTIFY_CHANGE_FILE_NAME | FILE_NOTIFY_CHANGE_DIR_NAME; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_MODIFIED) - filter |= FILE_NOTIFY_CHANGE_SIZE | FILE_NOTIFY_CHANGE_LAST_WRITE; - - std::string path(owner().directory().path()); - HANDLE hChange = FindFirstChangeNotificationA(path.c_str(), FALSE, filter); - - if (hChange == INVALID_HANDLE_VALUE) - { - try - { - FileImpl::handleLastErrorImpl(path); - } - catch (Poco::Exception& exc) - { - owner().scanError(&owner(), exc); - } - return; - } - - bool stopped = false; - while (!stopped) - { - try - { - HANDLE h[2]; - h[0] = _hStopped; - h[1] = hChange; - switch (WaitForMultipleObjects(2, h, FALSE, INFINITE)) - { - case WAIT_OBJECT_0: - stopped = true; - break; - case WAIT_OBJECT_0 + 1: - { - ItemInfoMap newEntries; - scan(newEntries); - compare(entries, newEntries); - std::swap(entries, newEntries); - if (FindNextChangeNotification(hChange) == FALSE) - { - FileImpl::handleLastErrorImpl(path); - } - } - break; - default: - throw SystemException("failed to wait for directory changes"); - } - } - catch (Poco::Exception& exc) - { - owner().scanError(&owner(), exc); - } - } - FindCloseChangeNotification(hChange); - } - - void stop() - { - 
SetEvent(_hStopped); - } - - bool supportsMoveEvents() const - { - return false; - } - -private: - HANDLE _hStopped; -}; - - -#elif POCO_OS == POCO_OS_LINUX || POCO_OS == POCO_OS_ANDROID - - -class LinuxDirectoryWatcherStrategy: public DirectoryWatcherStrategy -{ -public: - LinuxDirectoryWatcherStrategy(DirectoryWatcher& owner): - DirectoryWatcherStrategy(owner), - _fd(-1), - _stopped(false) - { - _fd = inotify_init(); - if (_fd == -1) throw Poco::IOException("cannot initialize inotify", errno); - } - - ~LinuxDirectoryWatcherStrategy() - { - close(_fd); - } - - void run() - { - int mask = 0; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_ADDED) - mask |= IN_CREATE; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_REMOVED) - mask |= IN_DELETE; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_MODIFIED) - mask |= IN_MODIFY; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_MOVED_FROM) - mask |= IN_MOVED_FROM; - if (owner().eventMask() & DirectoryWatcher::DW_ITEM_MOVED_TO) - mask |= IN_MOVED_TO; - int wd = inotify_add_watch(_fd, owner().directory().path().c_str(), mask); - if (wd == -1) - { - try - { - FileImpl::handleLastErrorImpl(owner().directory().path()); - } - catch (Poco::Exception& exc) - { - owner().scanError(&owner(), exc); - } - } - - Poco::Buffer buffer(4096); - while (!_stopped.load(std::memory_order_relaxed)) - { - fd_set fds; - FD_ZERO(&fds); - FD_SET(_fd, &fds); - - struct timeval tv; - tv.tv_sec = 0; - tv.tv_usec = 200000; - - if (select(_fd + 1, &fds, NULL, NULL, &tv) == 1) - { - int n = read(_fd, buffer.begin(), buffer.size()); - int i = 0; - if (n > 0) - { - while (n > 0) - { - struct inotify_event* event = reinterpret_cast(buffer.begin() + i); - - if (event->len > 0) - { - if (!owner().eventsSuspended()) - { - Poco::Path p(owner().directory().path()); - p.makeDirectory(); - p.setFileName(event->name); - Poco::File f(p.toString()); - - if ((event->mask & IN_CREATE) && (owner().eventMask() & DirectoryWatcher::DW_ITEM_ADDED)) - { - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_ADDED); - owner().itemAdded(&owner(), ev); - } - if ((event->mask & IN_DELETE) && (owner().eventMask() & DirectoryWatcher::DW_ITEM_REMOVED)) - { - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_REMOVED); - owner().itemRemoved(&owner(), ev); - } - if ((event->mask & IN_MODIFY) && (owner().eventMask() & DirectoryWatcher::DW_ITEM_MODIFIED)) - { - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_MODIFIED); - owner().itemModified(&owner(), ev); - } - if ((event->mask & IN_MOVED_FROM) && (owner().eventMask() & DirectoryWatcher::DW_ITEM_MOVED_FROM)) - { - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_MOVED_FROM); - owner().itemMovedFrom(&owner(), ev); - } - if ((event->mask & IN_MOVED_TO) && (owner().eventMask() & DirectoryWatcher::DW_ITEM_MOVED_TO)) - { - DirectoryWatcher::DirectoryEvent ev(f, DirectoryWatcher::DW_ITEM_MOVED_TO); - owner().itemMovedTo(&owner(), ev); - } - } - } - - i += sizeof(inotify_event) + event->len; - n -= sizeof(inotify_event) + event->len; - } - } - } - } - } - - void stop() - { - _stopped.store(true, std::memory_order_relaxed); - } - - bool supportsMoveEvents() const - { - return true; - } - -private: - int _fd; - std::atomic _stopped; -}; - - -#elif POCO_OS == POCO_OS_MAC_OS_X || POCO_OS == POCO_OS_FREE_BSD - - -class BSDDirectoryWatcherStrategy: public DirectoryWatcherStrategy -{ -public: - BSDDirectoryWatcherStrategy(DirectoryWatcher& owner): - DirectoryWatcherStrategy(owner), - 
_queueFD(-1), - _dirFD(-1), - _stopped(false) - { - _dirFD = open(owner.directory().path().c_str(), O_EVTONLY); - if (_dirFD < 0) throw Poco::FileNotFoundException(owner.directory().path()); - _queueFD = kqueue(); - if (_queueFD < 0) - { - close(_dirFD); - throw Poco::SystemException("Cannot create kqueue", errno); - } - } - - ~BSDDirectoryWatcherStrategy() - { - close(_dirFD); - close(_queueFD); - } - - void run() - { - Poco::Timestamp lastScan; - ItemInfoMap entries; - scan(entries); - - while (!_stopped.load(std::memory_order_relaxed)) - { - struct timespec timeout; - timeout.tv_sec = 0; - timeout.tv_nsec = 200000000; - unsigned eventFilter = NOTE_WRITE; - struct kevent event; - struct kevent eventData; - EV_SET(&event, _dirFD, EVFILT_VNODE, EV_ADD | EV_CLEAR, eventFilter, 0, 0); - int nEvents = kevent(_queueFD, &event, 1, &eventData, 1, &timeout); - if (nEvents < 0 || eventData.flags == EV_ERROR) - { - try - { - FileImpl::handleLastErrorImpl(owner().directory().path()); - } - catch (Poco::Exception& exc) - { - owner().scanError(&owner(), exc); - } - } - else if (nEvents > 0 || ((owner().eventMask() & DirectoryWatcher::DW_ITEM_MODIFIED) && lastScan.isElapsed(owner().scanInterval()*1000000))) - { - ItemInfoMap newEntries; - scan(newEntries); - compare(entries, newEntries); - std::swap(entries, newEntries); - lastScan.update(); - } - } - } - - void stop() - { - _stopped.store(true, std::memory_order_relaxed); - } - - bool supportsMoveEvents() const - { - return false; - } - -private: - int _queueFD; - int _dirFD; - std::atomic _stopped; -}; - - -#else - - -class PollingDirectoryWatcherStrategy: public DirectoryWatcherStrategy -{ -public: - PollingDirectoryWatcherStrategy(DirectoryWatcher& owner): - DirectoryWatcherStrategy(owner) - { - } - - ~PollingDirectoryWatcherStrategy() - { - } - - void run() - { - ItemInfoMap entries; - scan(entries); - while (!_stopped.tryWait(1000*owner().scanInterval())) - { - try - { - ItemInfoMap newEntries; - scan(newEntries); - compare(entries, newEntries); - std::swap(entries, newEntries); - } - catch (Poco::Exception& exc) - { - owner().scanError(&owner(), exc); - } - } - } - - void stop() - { - _stopped.set(); - } - - bool supportsMoveEvents() const - { - return false; - } - -private: - Poco::Event _stopped; -}; - - -#endif - - -DirectoryWatcher::DirectoryWatcher(const std::string& path, int eventMask, int scanInterval): - _directory(path), - _eventMask(eventMask), - _scanInterval(scanInterval) -{ - init(); -} - - -DirectoryWatcher::DirectoryWatcher(const Poco::File& directory, int eventMask, int scanInterval): - _directory(directory), - _eventMask(eventMask), - _scanInterval(scanInterval) -{ - init(); -} - - -DirectoryWatcher::~DirectoryWatcher() -{ - try - { - stop(); - delete _pStrategy; - } - catch (...) 
- { - poco_unexpected(); - } -} - - -void DirectoryWatcher::suspendEvents() -{ - poco_assert (_eventsSuspended > 0); - - _eventsSuspended--; -} - - -void DirectoryWatcher::resumeEvents() -{ - _eventsSuspended++; -} - - -void DirectoryWatcher::init() -{ - if (!_directory.exists()) - throw Poco::FileNotFoundException(_directory.path()); - - if (!_directory.isDirectory()) - throw Poco::InvalidArgumentException("not a directory", _directory.path()); - -#if POCO_OS == POCO_OS_WINDOWS_NT - _pStrategy = new WindowsDirectoryWatcherStrategy(*this); -#elif POCO_OS == POCO_OS_LINUX || POCO_OS == POCO_OS_ANDROID - _pStrategy = new LinuxDirectoryWatcherStrategy(*this); -#elif POCO_OS == POCO_OS_MAC_OS_X || POCO_OS == POCO_OS_FREE_BSD - _pStrategy = new BSDDirectoryWatcherStrategy(*this); -#else - _pStrategy = new PollingDirectoryWatcherStrategy(*this); -#endif - _thread.start(*this); -} - - -void DirectoryWatcher::run() -{ - _pStrategy->run(); -} - - -void DirectoryWatcher::stop() -{ - _pStrategy->stop(); - _thread.join(); -} - - -bool DirectoryWatcher::supportsMoveEvents() const -{ - return _pStrategy->supportsMoveEvents(); -} - - -} // namespace Poco - - -#endif // POCO_NO_INOTIFY diff --git a/base/poco/Foundation/src/UTF32Encoding.cpp b/base/poco/Foundation/src/UTF32Encoding.cpp index ff07006a4fb..e600c5d9445 100644 --- a/base/poco/Foundation/src/UTF32Encoding.cpp +++ b/base/poco/Foundation/src/UTF32Encoding.cpp @@ -30,22 +30,22 @@ const char* UTF32Encoding::_names[] = const TextEncoding::CharacterMap UTF32Encoding::_charMap = { - /* 00 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 10 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 20 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 30 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 40 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 50 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 60 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 70 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 80 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* 90 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* a0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* b0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* c0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* d0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* e0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, - /* f0 */ -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, -2, + /* 00 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 10 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 20 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 30 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 40 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 50 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 60 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 70 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 80 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* 90 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* a0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, 
-4, -4, -4, -4, + /* b0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* c0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* d0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* e0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, + /* f0 */ -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, -4, }; @@ -118,7 +118,7 @@ const TextEncoding::CharacterMap& UTF32Encoding::characterMap() const int UTF32Encoding::convert(const unsigned char* bytes) const { UInt32 uc; - unsigned char* p = (unsigned char*) &uc; + unsigned char* p = reinterpret_cast(&uc); *p++ = *bytes++; *p++ = *bytes++; *p++ = *bytes++; @@ -129,7 +129,7 @@ int UTF32Encoding::convert(const unsigned char* bytes) const ByteOrder::flipBytes(uc); } - return uc; + return safeToInt(uc); } @@ -138,7 +138,7 @@ int UTF32Encoding::convert(int ch, unsigned char* bytes, int length) const if (bytes && length >= 4) { UInt32 ch1 = _flipBytes ? ByteOrder::flipBytes((UInt32) ch) : (UInt32) ch; - unsigned char* p = (unsigned char*) &ch1; + unsigned char* p = reinterpret_cast(&ch1); *bytes++ = *p++; *bytes++ = *p++; *bytes++ = *p++; @@ -155,14 +155,14 @@ int UTF32Encoding::queryConvert(const unsigned char* bytes, int length) const if (length >= 4) { UInt32 uc; - unsigned char* p = (unsigned char*) &uc; + unsigned char* p = reinterpret_cast(&uc); *p++ = *bytes++; *p++ = *bytes++; *p++ = *bytes++; *p++ = *bytes++; if (_flipBytes) ByteOrder::flipBytes(uc); - return uc; + ret = safeToInt(uc); } return ret; diff --git a/base/poco/Util/src/XMLConfiguration.cpp b/base/poco/Util/src/XMLConfiguration.cpp index e0d363cc870..648084aa28e 100644 --- a/base/poco/Util/src/XMLConfiguration.cpp +++ b/base/poco/Util/src/XMLConfiguration.cpp @@ -18,6 +18,7 @@ #ifndef POCO_UTIL_NO_XMLCONFIGURATION +#include "Poco/String.h" #include "Poco/SAX/InputSource.h" #include "Poco/DOM/DOMParser.h" #include "Poco/DOM/Element.h" @@ -28,6 +29,8 @@ #include "Poco/NumberParser.h" #include "Poco/NumberFormatter.h" #include +#include +#include namespace Poco { @@ -275,8 +278,9 @@ void XMLConfiguration::enumerate(const std::string& key, Keys& range) const { if (pChild->nodeType() == Poco::XML::Node::ELEMENT_NODE) { - const std::string& nodeName = pChild->nodeName(); + std::string nodeName = pChild->nodeName(); size_t& count = keys[nodeName]; + replaceInPlace(nodeName, ".", "\\."); if (count) range.push_back(nodeName + "[" + NumberFormatter::format(count) + "]"); else @@ -379,7 +383,21 @@ Poco::XML::Node* XMLConfiguration::findNode(std::string::const_iterator& it, con { while (it != end && *it == _delim) ++it; std::string key; - while (it != end && *it != _delim && *it != '[') key += *it++; + while (it != end) + { + if (*it == '\\' && std::distance(it, end) > 1) + { + // Skip backslash, copy only the char after it + std::advance(it, 1); + key += *it++; + continue; + } + if (*it == _delim) + break; + if (*it == '[') + break; + key += *it++; + } return findNode(it, end, findElement(key, pNode, create), create); } } diff --git a/cmake/autogenerated_versions.txt b/cmake/autogenerated_versions.txt index 1e0a82a1403..e5a8c064808 100644 --- a/cmake/autogenerated_versions.txt +++ b/cmake/autogenerated_versions.txt @@ -2,11 +2,11 @@ # NOTE: has nothing common with DBMS_TCP_PROTOCOL_VERSION, # only DBMS_TCP_PROTOCOL_VERSION should be incremented on protocol changes. 
-SET(VERSION_REVISION 54480) -SET(VERSION_MAJOR 23) -SET(VERSION_MINOR 11) +SET(VERSION_REVISION 54482) +SET(VERSION_MAJOR 24) +SET(VERSION_MINOR 1) SET(VERSION_PATCH 1) -SET(VERSION_GITHASH 13adae0e42fd48de600486fc5d4b64d39f80c43e) -SET(VERSION_DESCRIBE v23.11.1.1-testing) -SET(VERSION_STRING 23.11.1.1) +SET(VERSION_GITHASH a2faa65b080a587026c86844f3a20c74d23a86f8) +SET(VERSION_DESCRIBE v24.1.1.1-testing) +SET(VERSION_STRING 24.1.1.1) # end of autochange diff --git a/cmake/target.cmake b/cmake/target.cmake index 887f79bf24e..fb911ace7b5 100644 --- a/cmake/target.cmake +++ b/cmake/target.cmake @@ -12,6 +12,8 @@ elseif (CMAKE_SYSTEM_NAME MATCHES "FreeBSD") elseif (CMAKE_SYSTEM_NAME MATCHES "Darwin") set (OS_DARWIN 1) add_definitions(-D OS_DARWIN) + # For MAP_ANON/MAP_ANONYMOUS + add_definitions(-D _DARWIN_C_SOURCE) elseif (CMAKE_SYSTEM_NAME MATCHES "SunOS") set (OS_SUNOS 1) add_definitions(-D OS_SUNOS) @@ -42,10 +44,8 @@ if (CMAKE_CROSSCOMPILING) if (ARCH_AARCH64) # FIXME: broken dependencies set (ENABLE_GRPC OFF CACHE INTERNAL "") - set (ENABLE_SENTRY OFF CACHE INTERNAL "") elseif (ARCH_PPC64LE) set (ENABLE_GRPC OFF CACHE INTERNAL "") - set (ENABLE_SENTRY OFF CACHE INTERNAL "") elseif (ARCH_RISCV64) # RISC-V support is preliminary set (GLIBC_COMPATIBILITY OFF CACHE INTERNAL "") @@ -73,19 +73,5 @@ if (CMAKE_CROSSCOMPILING) message (FATAL_ERROR "Trying to cross-compile to unsupported system: ${CMAKE_SYSTEM_NAME}!") endif () - if (USE_MUSL) - # use of undeclared identifier 'PTHREAD_RECURSIVE_MUTEX_INITIALIZER_NP' - set (ENABLE_SENTRY OFF CACHE INTERNAL "") - set (ENABLE_ODBC OFF CACHE INTERNAL "") - set (ENABLE_GRPC OFF CACHE INTERNAL "") - set (ENABLE_HDFS OFF CACHE INTERNAL "") - set (ENABLE_EMBEDDED_COMPILER OFF CACHE INTERNAL "") - # use of drand48_data - set (ENABLE_AZURE_BLOB_STORAGE OFF CACHE INTERNAL "") - endif () - - # Don't know why but CXX_STANDARD doesn't work for cross-compilation - set (CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -std=c++20") - message (STATUS "Cross-compiling for target: ${CMAKE_CXX_COMPILE_TARGET}") endif () diff --git a/contrib/CMakeLists.txt b/contrib/CMakeLists.txt index 3d3b9b72faf..1b5ba15187f 100644 --- a/contrib/CMakeLists.txt +++ b/contrib/CMakeLists.txt @@ -135,9 +135,9 @@ add_contrib (libuv-cmake libuv) add_contrib (liburing-cmake liburing) add_contrib (amqpcpp-cmake AMQP-CPP) # requires: libuv add_contrib (cassandra-cmake cassandra) # requires: libuv +add_contrib (curl-cmake curl) +add_contrib (azure-cmake azure) # requires: curl if (NOT OS_DARWIN) - add_contrib (curl-cmake curl) - add_contrib (azure-cmake azure) # requires: curl add_contrib (sentry-native-cmake sentry-native) # requires: curl endif() add_contrib (fmtlib-cmake fmtlib) diff --git a/contrib/azure b/contrib/azure index 096049bf24f..060c54dfb0a 160000 --- a/contrib/azure +++ b/contrib/azure @@ -1 +1 @@ -Subproject commit 096049bf24fffafcaccc132b9367694532716731 +Subproject commit 060c54dfb0abe869c065143303a9d3e9c54c29e3 diff --git a/contrib/azure-cmake/CMakeLists.txt b/contrib/azure-cmake/CMakeLists.txt index bb44c993e79..0d2512c9e6e 100644 --- a/contrib/azure-cmake/CMakeLists.txt +++ b/contrib/azure-cmake/CMakeLists.txt @@ -8,37 +8,21 @@ endif() set(AZURE_DIR "${ClickHouse_SOURCE_DIR}/contrib/azure") set(AZURE_SDK_LIBRARY_DIR "${AZURE_DIR}/sdk") -file(GLOB AZURE_SDK_CORE_SRC +file(GLOB AZURE_SDK_SRC "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/*.cpp" "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/cryptography/*.cpp" "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/http/*.cpp" - 
"${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/http/curl/*.hpp" "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/http/curl/*.cpp" - "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/winhttp/*.cpp" "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/io/*.cpp" - "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/private/*.hpp" -) - -file(GLOB AZURE_SDK_IDENTITY_SRC + "${AZURE_SDK_LIBRARY_DIR}/core/azure-core/src/tracing/*.cpp" "${AZURE_SDK_LIBRARY_DIR}/identity/azure-identity/src/*.cpp" - "${AZURE_SDK_LIBRARY_DIR}/identity/azure-identity/src/private/*.hpp" -) - -file(GLOB AZURE_SDK_STORAGE_COMMON_SRC - "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-common/src/*.cpp" - "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-common/src/private/*.cpp" -) - -file(GLOB AZURE_SDK_STORAGE_BLOBS_SRC "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-blobs/src/*.cpp" - "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-blobs/src/private/*.hpp" + "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-blobs/src/private/*.cpp" + "${AZURE_SDK_LIBRARY_DIR}/storage/azure-storage-common/src/*.cpp" ) file(GLOB AZURE_SDK_UNIFIED_SRC - ${AZURE_SDK_CORE_SRC} - ${AZURE_SDK_IDENTITY_SRC} - ${AZURE_SDK_STORAGE_COMMON_SRC} - ${AZURE_SDK_STORAGE_BLOBS_SRC} + ${AZURE_SDK_SRC} ) set(AZURE_SDK_INCLUDES diff --git a/contrib/boringssl b/contrib/boringssl index 8061ac62d67..aa6d2f865a2 160000 --- a/contrib/boringssl +++ b/contrib/boringssl @@ -1 +1 @@ -Subproject commit 8061ac62d67953e61b793042e33baf1352e67510 +Subproject commit aa6d2f865a2eab01cf94f197e11e36b6de47b5b4 diff --git a/contrib/curl-cmake/CMakeLists.txt b/contrib/curl-cmake/CMakeLists.txt index 7e86352befc..e74629e57b3 100644 --- a/contrib/curl-cmake/CMakeLists.txt +++ b/contrib/curl-cmake/CMakeLists.txt @@ -10,7 +10,7 @@ set (LIBRARY_DIR "${ClickHouse_SOURCE_DIR}/contrib/curl") set (SRCS "${LIBRARY_DIR}/lib/altsvc.c" "${LIBRARY_DIR}/lib/amigaos.c" - "${LIBRARY_DIR}/lib/asyn-thread.c" + "${LIBRARY_DIR}/lib/asyn-ares.c" "${LIBRARY_DIR}/lib/base64.c" "${LIBRARY_DIR}/lib/bufq.c" "${LIBRARY_DIR}/lib/bufref.c" @@ -165,13 +165,14 @@ target_compile_definitions (_curl PRIVATE libcurl_EXPORTS OS="${CMAKE_SYSTEM_NAME}" ) + target_include_directories (_curl SYSTEM PUBLIC "${LIBRARY_DIR}/include" "${LIBRARY_DIR}/lib" . # curl_config.h ) -target_link_libraries (_curl PRIVATE OpenSSL::SSL) +target_link_libraries (_curl PRIVATE OpenSSL::SSL ch_contrib::c-ares) # The library is large - avoid bloat (XXX: is it?) 
if (OMIT_HEAVY_DEBUG_SYMBOLS) diff --git a/contrib/curl-cmake/curl_config.h b/contrib/curl-cmake/curl_config.h index f56ba3eccd5..a38aa60fe6d 100644 --- a/contrib/curl-cmake/curl_config.h +++ b/contrib/curl-cmake/curl_config.h @@ -50,3 +50,4 @@ #define ENABLE_IPV6 #define USE_OPENSSL #define USE_THREADS_POSIX +#define USE_ARES diff --git a/contrib/libhdfs3 b/contrib/libhdfs3 index bdcb91354b1..b9598e60167 160000 --- a/contrib/libhdfs3 +++ b/contrib/libhdfs3 @@ -1 +1 @@ -Subproject commit bdcb91354b1c05b21e73043a112a6f1e3b013497 +Subproject commit b9598e6016720a7c088bfe85ce1fa0410f9d2103 diff --git a/contrib/libhdfs3-cmake/CMakeLists.txt b/contrib/libhdfs3-cmake/CMakeLists.txt index 4278575fd7f..8cd951af746 100644 --- a/contrib/libhdfs3-cmake/CMakeLists.txt +++ b/contrib/libhdfs3-cmake/CMakeLists.txt @@ -26,6 +26,11 @@ ADD_DEFINITIONS(-D__STDC_FORMAT_MACROS) ADD_DEFINITIONS(-D_GNU_SOURCE) ADD_DEFINITIONS(-D_GLIBCXX_USE_NANOSLEEP) ADD_DEFINITIONS(-DHAVE_NANOSLEEP) + +if (USE_MUSL) + ADD_DEFINITIONS(-DSTRERROR_R_RETURN_INT) +endif () + set(HAVE_STEADY_CLOCK 1) set(HAVE_NESTED_EXCEPTION 1) SET(HAVE_BOOST_CHRONO 0) diff --git a/contrib/librdkafka b/contrib/librdkafka index 6f3b483426a..2d2aab6f5b7 160000 --- a/contrib/librdkafka +++ b/contrib/librdkafka @@ -1 +1 @@ -Subproject commit 6f3b483426a8c8ec950e27e446bec175cf8b553f +Subproject commit 2d2aab6f5b79db1cfca15d7bf0dee75d00d82082 diff --git a/contrib/libxml2-cmake/linux_x86_64/include/libxml/xmlversion.h b/contrib/libxml2-cmake/linux_x86_64/include/libxml/xmlversion.h index 9eabfaa50c8..c2faeb47cb1 100644 --- a/contrib/libxml2-cmake/linux_x86_64/include/libxml/xmlversion.h +++ b/contrib/libxml2-cmake/linux_x86_64/include/libxml/xmlversion.h @@ -270,7 +270,7 @@ XMLPUBFUN void XMLCALL xmlCheckVersion(int version); * * Whether iconv support is available */ -#if 1 +#if 0 #define LIBXML_ICONV_ENABLED #endif @@ -499,5 +499,3 @@ XMLPUBFUN void XMLCALL xmlCheckVersion(int version); } #endif /* __cplusplus */ #endif - - diff --git a/contrib/llvm-project b/contrib/llvm-project index e7b8befca85..1834e42289c 160000 --- a/contrib/llvm-project +++ b/contrib/llvm-project @@ -1 +1 @@ -Subproject commit e7b8befca85c8b847614432dba250c22d35fbae0 +Subproject commit 1834e42289c58402c804a87be4d489892b88f3ec diff --git a/contrib/llvm-project-cmake/CMakeLists.txt b/contrib/llvm-project-cmake/CMakeLists.txt index 406bac73e90..d09060912d8 100644 --- a/contrib/llvm-project-cmake/CMakeLists.txt +++ b/contrib/llvm-project-cmake/CMakeLists.txt @@ -11,7 +11,9 @@ option (ENABLE_EMBEDDED_COMPILER "Enable support for JIT compilation during quer option (ENABLE_DWARF_PARSER "Enable support for DWARF input format (uses LLVM library)" ${ENABLE_DWARF_PARSER_DEFAULT}) -if (NOT ENABLE_EMBEDDED_COMPILER AND NOT ENABLE_DWARF_PARSER) +option (ENABLE_BLAKE3 "Enable BLAKE3 function" ${ENABLE_LIBRARIES}) + +if (NOT ENABLE_EMBEDDED_COMPILER AND NOT ENABLE_DWARF_PARSER AND NOT ENABLE_BLAKE3) message(STATUS "Not using LLVM") return() endif() @@ -26,61 +28,75 @@ set (LLVM_LIBRARY_DIRS "${ClickHouse_BINARY_DIR}/contrib/llvm-project/llvm") # and llvm cannot be compiled with bundled libcxx and 20 standard. set (CMAKE_CXX_STANDARD 14) -# This list was generated by listing all LLVM libraries, compiling the binary and removing all libraries while it still compiles. 
-set (REQUIRED_LLVM_LIBRARIES - LLVMExecutionEngine - LLVMRuntimeDyld - LLVMAsmPrinter - LLVMDebugInfoDWARF - LLVMGlobalISel - LLVMSelectionDAG - LLVMMCDisassembler - LLVMPasses - LLVMCodeGen - LLVMipo - LLVMBitWriter - LLVMInstrumentation - LLVMScalarOpts - LLVMAggressiveInstCombine - LLVMInstCombine - LLVMVectorize - LLVMTransformUtils - LLVMTarget - LLVMAnalysis - LLVMProfileData - LLVMObject - LLVMBitReader - LLVMCore - LLVMRemarks - LLVMBitstreamReader - LLVMMCParser - LLVMMC - LLVMBinaryFormat - LLVMDebugInfoCodeView - LLVMSupport - LLVMDemangle -) +if (ARCH_AMD64) + set (LLVM_TARGETS_TO_BUILD "X86" CACHE INTERNAL "") +elseif (ARCH_AARCH64) + set (LLVM_TARGETS_TO_BUILD "AArch64" CACHE INTERNAL "") +elseif (ARCH_PPC64LE) + set (LLVM_TARGETS_TO_BUILD "PowerPC" CACHE INTERNAL "") +elseif (ARCH_S390X) + set (LLVM_TARGETS_TO_BUILD "SystemZ" CACHE INTERNAL "") +elseif (ARCH_RISCV64) + set (LLVM_TARGETS_TO_BUILD "RISCV" CACHE INTERNAL "") +endif () + + +if (NOT ENABLE_EMBEDDED_COMPILER AND NOT ENABLE_DWARF_PARSER) + # Only compiling blake3 + set (REQUIRED_LLVM_LIBRARIES LLVMSupport) +else() + # This list was generated by listing all LLVM libraries, compiling the binary and removing all libraries while it still compiles. + set (REQUIRED_LLVM_LIBRARIES + LLVMExecutionEngine + LLVMRuntimeDyld + LLVMAsmPrinter + LLVMDebugInfoDWARF + LLVMGlobalISel + LLVMSelectionDAG + LLVMMCDisassembler + LLVMPasses + LLVMCodeGen + LLVMipo + LLVMBitWriter + LLVMInstrumentation + LLVMScalarOpts + LLVMAggressiveInstCombine + LLVMInstCombine + LLVMVectorize + LLVMTransformUtils + LLVMTarget + LLVMAnalysis + LLVMProfileData + LLVMObject + LLVMBitReader + LLVMCore + LLVMRemarks + LLVMBitstreamReader + LLVMMCParser + LLVMMC + LLVMBinaryFormat + LLVMDebugInfoCodeView + LLVMSupport + LLVMDemangle + ) + + if (ARCH_AMD64) + list(APPEND REQUIRED_LLVM_LIBRARIES LLVMX86Info LLVMX86Desc LLVMX86CodeGen) + elseif (ARCH_AARCH64) + list(APPEND REQUIRED_LLVM_LIBRARIES LLVMAArch64Info LLVMAArch64Desc LLVMAArch64CodeGen) + elseif (ARCH_PPC64LE) + list(APPEND REQUIRED_LLVM_LIBRARIES LLVMPowerPCInfo LLVMPowerPCDesc LLVMPowerPCCodeGen) + elseif (ARCH_S390X) + list(APPEND REQUIRED_LLVM_LIBRARIES LLVMSystemZInfo LLVMSystemZDesc LLVMSystemZCodeGen) + elseif (ARCH_RISCV64) + list(APPEND REQUIRED_LLVM_LIBRARIES LLVMRISCVInfo LLVMRISCVDesc LLVMRISCVCodeGen) + endif () +endif() + # Skip useless "install" instructions from CMake: set (LLVM_INSTALL_TOOLCHAIN_ONLY 1 CACHE INTERNAL "") -if (ARCH_AMD64) - set (LLVM_TARGETS_TO_BUILD "X86" CACHE INTERNAL "") - list(APPEND REQUIRED_LLVM_LIBRARIES LLVMX86Info LLVMX86Desc LLVMX86CodeGen) -elseif (ARCH_AARCH64) - set (LLVM_TARGETS_TO_BUILD "AArch64" CACHE INTERNAL "") - list(APPEND REQUIRED_LLVM_LIBRARIES LLVMAArch64Info LLVMAArch64Desc LLVMAArch64CodeGen) -elseif (ARCH_PPC64LE) - set (LLVM_TARGETS_TO_BUILD "PowerPC" CACHE INTERNAL "") - list(APPEND REQUIRED_LLVM_LIBRARIES LLVMPowerPCInfo LLVMPowerPCDesc LLVMPowerPCCodeGen) -elseif (ARCH_S390X) - set (LLVM_TARGETS_TO_BUILD "SystemZ" CACHE INTERNAL "") - list(APPEND REQUIRED_LLVM_LIBRARIES LLVMSystemZInfo LLVMSystemZDesc LLVMSystemZCodeGen) -elseif (ARCH_RISCV64) - set (LLVM_TARGETS_TO_BUILD "RISCV" CACHE INTERNAL "") - list(APPEND REQUIRED_LLVM_LIBRARIES LLVMRISCVInfo LLVMRISCVDesc LLVMRISCVCodeGen) -endif () - message (STATUS "LLVM TARGETS TO BUILD ${LLVM_TARGETS_TO_BUILD}") set (CMAKE_INSTALL_RPATH "ON") # Do not adjust RPATH in llvm, since then it will not be able to find libcxx/libcxxabi/libunwind diff --git 
a/contrib/mariadb-connector-c-cmake/CMakeLists.txt b/contrib/mariadb-connector-c-cmake/CMakeLists.txt index 18d1510a57b..4257828890f 100644 --- a/contrib/mariadb-connector-c-cmake/CMakeLists.txt +++ b/contrib/mariadb-connector-c-cmake/CMakeLists.txt @@ -1,4 +1,4 @@ -if(OS_LINUX AND TARGET OpenSSL::SSL) +if((OS_LINUX OR OS_DARWIN) AND TARGET OpenSSL::SSL) option(ENABLE_MYSQL "Enable MySQL" ${ENABLE_LIBRARIES}) else () option(ENABLE_MYSQL "Enable MySQL" FALSE) @@ -73,7 +73,7 @@ set(HAVE_SYS_TYPES_H 1) set(HAVE_SYS_UN_H 1) set(HAVE_UNISTD_H 1) set(HAVE_UTIME_H 1) -set(HAVE_UCONTEXT_H 1) +set(HAVE_UCONTEXT_H 0) set(HAVE_ALLOCA 1) set(HAVE_DLERROR 0) set(HAVE_DLOPEN 0) @@ -116,9 +116,13 @@ CONFIGURE_FILE(${CC_SOURCE_DIR}/include/ma_config.h.in CONFIGURE_FILE(${CC_SOURCE_DIR}/include/mariadb_version.h.in ${CC_BINARY_DIR}/include-public/mariadb_version.h) -if(WITH_SSL) +if (WITH_SSL) set(SYSTEM_LIBS ${SYSTEM_LIBS} ${SSL_LIBRARIES}) -endif() +endif () + +if (OS_DARWIN) + set(SYSTEM_LIBS ${SYSTEM_LIBS} iconv) +endif () function(REGISTER_PLUGIN) @@ -227,15 +231,8 @@ ${CC_SOURCE_DIR}/libmariadb/secure/openssl_crypt.c ${CC_BINARY_DIR}/libmariadb/ma_client_plugin.c ) -if(ICONV_INCLUDE_DIR) - include_directories(BEFORE ${ICONV_INCLUDE_DIR}) -endif() add_definitions(-DLIBICONV_PLUG) -if(WITH_DYNCOL) - set(LIBMARIADB_SOURCES ${LIBMARIADB_SOURCES} ${CC_SOURCE_DIR}/libmariadb/mariadb_dyncol.c) -endif() - set(LIBMARIADB_SOURCES ${LIBMARIADB_SOURCES} ${CC_SOURCE_DIR}/libmariadb/mariadb_async.c ${CC_SOURCE_DIR}/libmariadb/ma_context.c) diff --git a/contrib/rocksdb-cmake/CMakeLists.txt b/contrib/rocksdb-cmake/CMakeLists.txt index 7d7666dff87..c4220ba90ac 100644 --- a/contrib/rocksdb-cmake/CMakeLists.txt +++ b/contrib/rocksdb-cmake/CMakeLists.txt @@ -117,7 +117,7 @@ endif() add_definitions(-DROCKSDB_PLATFORM_POSIX -DROCKSDB_LIB_IO_POSIX) -if (OS_LINUX OR OS_FREEBSD) +if ((OS_LINUX OR OS_FREEBSD) AND NOT USE_MUSL) add_definitions(-DROCKSDB_PTHREAD_ADAPTIVE_MUTEX) endif() diff --git a/contrib/sentry-native b/contrib/sentry-native index ae10fb8c224..bc359f86cbf 160000 --- a/contrib/sentry-native +++ b/contrib/sentry-native @@ -1 +1 @@ -Subproject commit ae10fb8c224c3f41571446e1ed7fd57b9e5e366b +Subproject commit bc359f86cbf0f73f6fd4b6bfb4ede0c1f8c9400f diff --git a/contrib/sentry-native-cmake/CMakeLists.txt b/contrib/sentry-native-cmake/CMakeLists.txt index 377f955f856..6364e75db28 100644 --- a/contrib/sentry-native-cmake/CMakeLists.txt +++ b/contrib/sentry-native-cmake/CMakeLists.txt @@ -13,6 +13,7 @@ set (SRC_DIR "${ClickHouse_SOURCE_DIR}/contrib/sentry-native") set (SRCS ${SRC_DIR}/vendor/mpack.c + ${SRC_DIR}/vendor/stb_sprintf.c ${SRC_DIR}/src/sentry_alloc.c ${SRC_DIR}/src/sentry_backend.c ${SRC_DIR}/src/sentry_core.c @@ -21,6 +22,7 @@ set (SRCS ${SRC_DIR}/src/sentry_json.c ${SRC_DIR}/src/sentry_logger.c ${SRC_DIR}/src/sentry_options.c + ${SRC_DIR}/src/sentry_os.c ${SRC_DIR}/src/sentry_random.c ${SRC_DIR}/src/sentry_ratelimiter.c ${SRC_DIR}/src/sentry_scope.c @@ -29,6 +31,7 @@ set (SRCS ${SRC_DIR}/src/sentry_string.c ${SRC_DIR}/src/sentry_sync.c ${SRC_DIR}/src/sentry_transport.c + ${SRC_DIR}/src/sentry_tracing.c ${SRC_DIR}/src/sentry_utils.c ${SRC_DIR}/src/sentry_uuid.c ${SRC_DIR}/src/sentry_value.c diff --git a/contrib/unixodbc-cmake/CMakeLists.txt b/contrib/unixodbc-cmake/CMakeLists.txt index 3317654cd67..6fbe8c14ebb 100644 --- a/contrib/unixodbc-cmake/CMakeLists.txt +++ b/contrib/unixodbc-cmake/CMakeLists.txt @@ -1,7 +1,7 @@ option (ENABLE_ODBC "Enable ODBC library" ${ENABLE_LIBRARIES}) -if (NOT OS_LINUX) 
+if (NOT OS_LINUX OR USE_MUSL) if (ENABLE_ODBC) - message(STATUS "ODBC is only supported on Linux") + message(STATUS "ODBC is only supported on Linux with dynamic linking") endif() set (ENABLE_ODBC OFF CACHE INTERNAL "") endif () diff --git a/docker/images.json b/docker/images.json index 1535715648c..d2f098f53d7 100644 --- a/docker/images.json +++ b/docker/images.json @@ -125,6 +125,7 @@ "docker/test/server-jepsen", "docker/test/sqllogic", "docker/test/sqltest", + "docker/test/clickbench", "docker/test/stateless" ] }, @@ -145,6 +146,10 @@ "name": "clickhouse/server-jepsen-test", "dependent": [] }, + "docker/test/clickbench": { + "name": "clickhouse/clickbench", + "dependent": [] + }, "docker/test/install/deb": { "name": "clickhouse/install-deb-test", "dependent": [] diff --git a/docker/keeper/Dockerfile b/docker/keeper/Dockerfile index b174dfde675..145f5d13cc2 100644 --- a/docker/keeper/Dockerfile +++ b/docker/keeper/Dockerfile @@ -34,8 +34,9 @@ RUN arch=${TARGETARCH:-amd64} \ # lts / testing / prestable / etc ARG REPO_CHANNEL="stable" ARG REPOSITORY="https://packages.clickhouse.com/tgz/${REPO_CHANNEL}" -ARG VERSION="23.10.5.20" +ARG VERSION="23.12.1.1368" ARG PACKAGES="clickhouse-keeper" +ARG DIRECT_DOWNLOAD_URLS="" # user/group precreated explicitly with fixed uid/gid on purpose. # It is especially important for rootless containers: in that case entrypoint @@ -47,15 +48,27 @@ ARG PACKAGES="clickhouse-keeper" ARG TARGETARCH RUN arch=${TARGETARCH:-amd64} \ - && for package in ${PACKAGES}; do \ - ( \ - cd /tmp \ - && echo "Get ${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ + && cd /tmp && rm -f /tmp/*tgz && rm -f /tmp/*tgz.sha512 |: \ + && if [ -n "${DIRECT_DOWNLOAD_URLS}" ]; then \ + echo "installing from provided urls with tgz packages: ${DIRECT_DOWNLOAD_URLS}" \ + && for url in $DIRECT_DOWNLOAD_URLS; do \ + echo "Get ${url}" \ + && wget -c -q "$url" \ + ; done \ + else \ + for package in ${PACKAGES}; do \ + cd /tmp \ + && echo "Get ${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ && wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ && wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz.sha512" \ - && sed 's:/output/:/tmp/:' < "${package}-${VERSION}-${arch}.tgz.sha512" | sha512sum -c \ - && tar xvzf "${package}-${VERSION}-${arch}.tgz" --strip-components=1 -C / \ - ) \ + ; done \ + fi \ + && cat *.tgz.sha512 | sha512sum -c \ + && for file in *.tgz; do \ + if [ -f "$file" ]; then \ + echo "Unpacking $file"; \ + tar xvzf "$file" --strip-components=1 -C /; \ + fi \ ; done \ && rm /tmp/*.tgz /install -r \ && addgroup -S -g 101 clickhouse \ diff --git a/docker/packager/README.md b/docker/packager/README.md index 3a91f9a63f0..e0b7f38ea58 100644 --- a/docker/packager/README.md +++ b/docker/packager/README.md @@ -3,10 +3,10 @@ compilers and build settings. 
Correctly configured Docker daemon is single depen Usage: -Build deb package with `clang-14` in `debug` mode: +Build deb package with `clang-17` in `debug` mode: ``` $ mkdir deb/test_output -$ ./packager --output-dir deb/test_output/ --package-type deb --compiler=clang-14 --debug-build +$ ./packager --output-dir deb/test_output/ --package-type deb --compiler=clang-17 --debug-build $ ls -l deb/test_output -rw-r--r-- 1 root root 3730 clickhouse-client_22.2.2+debug_all.deb -rw-r--r-- 1 root root 84221888 clickhouse-common-static_22.2.2+debug_amd64.deb @@ -17,11 +17,11 @@ $ ls -l deb/test_output ``` -Build ClickHouse binary with `clang-14` and `address` sanitizer in `relwithdebuginfo` +Build ClickHouse binary with `clang-17` and `address` sanitizer in `relwithdebuginfo` mode: ``` $ mkdir $HOME/some_clickhouse -$ ./packager --output-dir=$HOME/some_clickhouse --package-type binary --compiler=clang-14 --sanitizer=address +$ ./packager --output-dir=$HOME/some_clickhouse --package-type binary --compiler=clang-17 --sanitizer=address $ ls -l $HOME/some_clickhouse -rwxr-xr-x 1 root root 787061952 clickhouse lrwxrwxrwx 1 root root 10 clickhouse-benchmark -> clickhouse diff --git a/docker/packager/binary/Dockerfile b/docker/packager/binary/Dockerfile index 20fb97c80bb..1a99ab0d0b6 100644 --- a/docker/packager/binary/Dockerfile +++ b/docker/packager/binary/Dockerfile @@ -49,6 +49,7 @@ RUN curl https://sh.rustup.rs -sSf | bash -s -- -y && \ chmod 777 -R /rust && \ rustup toolchain install nightly-2023-07-04 && \ rustup default nightly-2023-07-04 && \ + rustup toolchain remove stable && \ rustup component add rust-src && \ rustup target add x86_64-unknown-linux-gnu && \ rustup target add aarch64-unknown-linux-gnu && \ diff --git a/docker/packager/binary/build.sh b/docker/packager/binary/build.sh index fd9bfcaabb2..b63643419fe 100755 --- a/docker/packager/binary/build.sh +++ b/docker/packager/binary/build.sh @@ -149,7 +149,7 @@ then mkdir -p "$PERF_OUTPUT" cp -r ../tests/performance "$PERF_OUTPUT" cp -r ../tests/config/top_level_domains "$PERF_OUTPUT" - cp -r ../docker/test/performance-comparison/config "$PERF_OUTPUT" ||: + cp -r ../tests/performance/scripts/config "$PERF_OUTPUT" ||: for SRC in /output/clickhouse*; do # Copy all clickhouse* files except packages and bridges [[ "$SRC" != *.* ]] && [[ "$SRC" != *-bridge ]] && \ @@ -160,7 +160,7 @@ then ln -sf clickhouse "$PERF_OUTPUT"/clickhouse-keeper fi - cp -r ../docker/test/performance-comparison "$PERF_OUTPUT"/scripts ||: + cp -r ../tests/performance/scripts "$PERF_OUTPUT"/scripts ||: prepare_combined_output "$PERF_OUTPUT" # We have to know the revision that corresponds to this binary build. 
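For reference, the package-install flow that the keeper and server Dockerfiles now implement (prefer DIRECT_DOWNLOAD_URLS when set, otherwise fetch the versioned tgz together with its checksum, verify, then unpack) can be read as the following standalone sketch. The repository URL, version, package list, and arch default are illustrative placeholders, and in this sketch checksum verification is only performed for repository downloads; the actual RUN steps differ in detail.

#!/bin/bash
# Sketch of the tgz install flow used by the keeper/server Dockerfiles (illustrative defaults below).
set -euo pipefail

REPOSITORY="${REPOSITORY:-https://packages.clickhouse.com/tgz/stable}"   # illustrative
VERSION="${VERSION:-24.1.1.1}"                                           # illustrative
PACKAGES="${PACKAGES:-clickhouse-keeper}"
DIRECT_DOWNLOAD_URLS="${DIRECT_DOWNLOAD_URLS:-}"
arch="${TARGETARCH:-amd64}"

cd /tmp && rm -f ./*.tgz ./*.tgz.sha512

if [ -n "$DIRECT_DOWNLOAD_URLS" ]; then
    # CI-built archives are taken exactly as provided (assumption: no checksum files accompany them).
    for url in $DIRECT_DOWNLOAD_URLS; do
        wget -c -q "$url"
    done
else
    # Released packages: fetch each archive together with its .sha512 file, then verify.
    for package in $PACKAGES; do
        wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz"
        wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz.sha512"
    done
    # The checksum files reference /output/, so rewrite the path before checking.
    cat ./*.tgz.sha512 | sed 's:/output/:/tmp/:' | sha512sum -c
fi

# Unpack whatever archives ended up in /tmp into the root filesystem.
for file in ./*.tgz; do
    if [ -f "$file" ]; then
        tar xzf "$file" --strip-components=1 -C /
    fi
done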
diff --git a/docker/packager/packager b/docker/packager/packager index b5bcbada1da..ade36a55591 100755 --- a/docker/packager/packager +++ b/docker/packager/packager @@ -145,6 +145,7 @@ def parse_env_variables( RISCV_SUFFIX = "-riscv64" S390X_SUFFIX = "-s390x" AMD64_COMPAT_SUFFIX = "-amd64-compat" + AMD64_MUSL_SUFFIX = "-amd64-musl" result = [] result.append("OUTPUT_DIR=/output") @@ -163,6 +164,7 @@ def parse_env_variables( is_cross_s390x = compiler.endswith(S390X_SUFFIX) is_cross_freebsd = compiler.endswith(FREEBSD_SUFFIX) is_amd64_compat = compiler.endswith(AMD64_COMPAT_SUFFIX) + is_amd64_musl = compiler.endswith(AMD64_MUSL_SUFFIX) if is_cross_darwin: cc = compiler[: -len(DARWIN_SUFFIX)] @@ -232,6 +234,12 @@ def parse_env_variables( cc = compiler[: -len(AMD64_COMPAT_SUFFIX)] result.append("DEB_ARCH=amd64") cmake_flags.append("-DNO_SSE3_OR_HIGHER=1") + elif is_amd64_musl: + cc = compiler[: -len(AMD64_MUSL_SUFFIX)] + result.append("DEB_ARCH=amd64") + cmake_flags.append( + "-DCMAKE_TOOLCHAIN_FILE=/build/cmake/linux/toolchain-x86_64-musl.cmake" + ) else: cc = compiler result.append("DEB_ARCH=amd64") @@ -396,6 +404,7 @@ def parse_args() -> argparse.Namespace: "clang-17-riscv64", "clang-17-s390x", "clang-17-amd64-compat", + "clang-17-amd64-musl", "clang-17-freebsd", ), default="clang-17", diff --git a/docker/server/Dockerfile.alpine b/docker/server/Dockerfile.alpine index d4498abda6a..26d65eb3ccc 100644 --- a/docker/server/Dockerfile.alpine +++ b/docker/server/Dockerfile.alpine @@ -32,8 +32,9 @@ RUN arch=${TARGETARCH:-amd64} \ # lts / testing / prestable / etc ARG REPO_CHANNEL="stable" ARG REPOSITORY="https://packages.clickhouse.com/tgz/${REPO_CHANNEL}" -ARG VERSION="23.10.5.20" +ARG VERSION="23.12.1.1368" ARG PACKAGES="clickhouse-client clickhouse-server clickhouse-common-static" +ARG DIRECT_DOWNLOAD_URLS="" # user/group precreated explicitly with fixed uid/gid on purpose. # It is especially important for rootless containers: in that case entrypoint @@ -43,15 +44,26 @@ ARG PACKAGES="clickhouse-client clickhouse-server clickhouse-common-static" # The same uid / gid (101) is used both for alpine and ubuntu. 
RUN arch=${TARGETARCH:-amd64} \ - && for package in ${PACKAGES}; do \ - ( \ - cd /tmp \ - && echo "Get ${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ + && cd /tmp \ + && if [ -n "${DIRECT_DOWNLOAD_URLS}" ]; then \ + echo "installing from provided urls with tgz packages: ${DIRECT_DOWNLOAD_URLS}" \ + && for url in $DIRECT_DOWNLOAD_URLS; do \ + echo "Get ${url}" \ + && wget -c -q "$url" \ + ; done \ + else \ + for package in ${PACKAGES}; do \ + echo "Get ${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ && wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz" \ && wget -c -q "${REPOSITORY}/${package}-${VERSION}-${arch}.tgz.sha512" \ - && sed 's:/output/:/tmp/:' < "${package}-${VERSION}-${arch}.tgz.sha512" | sha512sum -c \ - && tar xvzf "${package}-${VERSION}-${arch}.tgz" --strip-components=1 -C / \ - ) \ + ; done \ + fi \ + && cat *.tgz.sha512 | sed 's:/output/:/tmp/:' | sha512sum -c \ + && for file in *.tgz; do \ + if [ -f "$file" ]; then \ + echo "Unpacking $file"; \ + tar xvzf "$file" --strip-components=1 -C /; \ + fi \ ; done \ && rm /tmp/*.tgz /install -r \ && addgroup -S -g 101 clickhouse \ diff --git a/docker/server/Dockerfile.ubuntu b/docker/server/Dockerfile.ubuntu index 08e95cd535b..5b96b208b11 100644 --- a/docker/server/Dockerfile.ubuntu +++ b/docker/server/Dockerfile.ubuntu @@ -30,13 +30,14 @@ RUN sed -i "s|http://archive.ubuntu.com|${apt_archive}|g" /etc/apt/sources.list ARG REPO_CHANNEL="stable" ARG REPOSITORY="deb [signed-by=/usr/share/keyrings/clickhouse-keyring.gpg] https://packages.clickhouse.com/deb ${REPO_CHANNEL} main" -ARG VERSION="23.10.5.20" +ARG VERSION="23.12.1.1368" ARG PACKAGES="clickhouse-client clickhouse-server clickhouse-common-static" # set non-empty deb_location_url url to create a docker image # from debs created by CI build, for example: # docker build . --network host --build-arg version="21.4.1.6282" --build-arg deb_location_url="https://..." -t ... ARG deb_location_url="" +ARG DIRECT_DOWNLOAD_URLS="" # set non-empty single_binary_location_url to create docker image # from a single binary url (useful for non-standard builds - with sanitizers, for arm64). @@ -44,6 +45,18 @@ ARG single_binary_location_url="" ARG TARGETARCH +# install from direct URL +RUN if [ -n "${DIRECT_DOWNLOAD_URLS}" ]; then \ + echo "installing from custom predefined urls with deb packages: ${DIRECT_DOWNLOAD_URLS}" \ + && rm -rf /tmp/clickhouse_debs \ + && mkdir -p /tmp/clickhouse_debs \ + && for url in $DIRECT_DOWNLOAD_URLS; do \ + wget --progress=bar:force:noscroll "$url" -P /tmp/clickhouse_debs || exit 1 \ + ; done \ + && dpkg -i /tmp/clickhouse_debs/*.deb \ + && rm -rf /tmp/* ; \ + fi + # install from a web location with deb packages RUN arch="${TARGETARCH:-amd64}" \ && if [ -n "${deb_location_url}" ]; then \ @@ -83,7 +96,7 @@ RUN if ! 
clickhouse local -q "SELECT ''" > /dev/null 2>&1; then \ && GNUPGHOME="$GNUPGHOME" gpg --no-default-keyring \ --keyring /usr/share/keyrings/clickhouse-keyring.gpg \ --keyserver hkp://keyserver.ubuntu.com:80 --recv-keys 8919F6BD2B48D754 \ - && rm -r "$GNUPGHOME" \ + && rm -rf "$GNUPGHOME" \ && chmod +r /usr/share/keyrings/clickhouse-keyring.gpg \ && echo "${REPOSITORY}" > /etc/apt/sources.list.d/clickhouse.list \ && echo "installing from repository: ${REPOSITORY}" \ diff --git a/docker/test/base/Dockerfile b/docker/test/base/Dockerfile index b55baa0e0fc..b48017fdacc 100644 --- a/docker/test/base/Dockerfile +++ b/docker/test/base/Dockerfile @@ -12,6 +12,7 @@ RUN apt-get update \ ripgrep \ zstd \ locales \ + sudo \ --yes --no-install-recommends # Sanitizer options for services (clickhouse-server) diff --git a/docker/test/base/setup_export_logs.sh b/docker/test/base/setup_export_logs.sh index 6e3721956c0..ea82e071112 100755 --- a/docker/test/base/setup_export_logs.sh +++ b/docker/test/base/setup_export_logs.sh @@ -21,7 +21,7 @@ EXTRA_ORDER_BY_COLUMNS=${EXTRA_ORDER_BY_COLUMNS:-"check_name, "} # trace_log needs more columns for symbolization EXTRA_COLUMNS_TRACE_LOG="${EXTRA_COLUMNS} symbols Array(LowCardinality(String)), lines Array(LowCardinality(String)), " -EXTRA_COLUMNS_EXPRESSION_TRACE_LOG="${EXTRA_COLUMNS_EXPRESSION}, arrayMap(x -> toLowCardinality(demangle(addressToSymbol(x))), trace) AS symbols, arrayMap(x -> toLowCardinality(addressToLine(x)), trace) AS lines" +EXTRA_COLUMNS_EXPRESSION_TRACE_LOG="${EXTRA_COLUMNS_EXPRESSION}, arrayMap(x -> demangle(addressToSymbol(x)), trace)::Array(LowCardinality(String)) AS symbols, arrayMap(x -> addressToLine(x), trace)::Array(LowCardinality(String)) AS lines" function __set_connection_args diff --git a/docker/test/clickbench/Dockerfile b/docker/test/clickbench/Dockerfile new file mode 100644 index 00000000000..0b6b1736e03 --- /dev/null +++ b/docker/test/clickbench/Dockerfile @@ -0,0 +1,10 @@ +ARG FROM_TAG=latest +FROM clickhouse/test-base:$FROM_TAG + +ENV TZ=Europe/Amsterdam +RUN ln -snf /usr/share/zoneinfo/$TZ /etc/localtime && echo $TZ > /etc/timezone + +COPY *.sh / +COPY *.sql / + +CMD ["/bin/bash", "/run.sh"] diff --git a/docker/test/clickbench/create.sql b/docker/test/clickbench/create.sql new file mode 100644 index 00000000000..9f18a47474b --- /dev/null +++ b/docker/test/clickbench/create.sql @@ -0,0 +1,112 @@ +ATTACH TABLE hits UUID 'c449dfbf-ba06-4d13-abec-8396559eb955' +( + WatchID BIGINT NOT NULL, + JavaEnable SMALLINT NOT NULL, + Title TEXT NOT NULL, + GoodEvent SMALLINT NOT NULL, + EventTime TIMESTAMP NOT NULL, + EventDate Date NOT NULL, + CounterID INTEGER NOT NULL, + ClientIP INTEGER NOT NULL, + RegionID INTEGER NOT NULL, + UserID BIGINT NOT NULL, + CounterClass SMALLINT NOT NULL, + OS SMALLINT NOT NULL, + UserAgent SMALLINT NOT NULL, + URL TEXT NOT NULL, + Referer TEXT NOT NULL, + IsRefresh SMALLINT NOT NULL, + RefererCategoryID SMALLINT NOT NULL, + RefererRegionID INTEGER NOT NULL, + URLCategoryID SMALLINT NOT NULL, + URLRegionID INTEGER NOT NULL, + ResolutionWidth SMALLINT NOT NULL, + ResolutionHeight SMALLINT NOT NULL, + ResolutionDepth SMALLINT NOT NULL, + FlashMajor SMALLINT NOT NULL, + FlashMinor SMALLINT NOT NULL, + FlashMinor2 TEXT NOT NULL, + NetMajor SMALLINT NOT NULL, + NetMinor SMALLINT NOT NULL, + UserAgentMajor SMALLINT NOT NULL, + UserAgentMinor VARCHAR(255) NOT NULL, + CookieEnable SMALLINT NOT NULL, + JavascriptEnable SMALLINT NOT NULL, + IsMobile SMALLINT NOT NULL, + MobilePhone SMALLINT NOT NULL, + MobilePhoneModel 
TEXT NOT NULL, + Params TEXT NOT NULL, + IPNetworkID INTEGER NOT NULL, + TraficSourceID SMALLINT NOT NULL, + SearchEngineID SMALLINT NOT NULL, + SearchPhrase TEXT NOT NULL, + AdvEngineID SMALLINT NOT NULL, + IsArtifical SMALLINT NOT NULL, + WindowClientWidth SMALLINT NOT NULL, + WindowClientHeight SMALLINT NOT NULL, + ClientTimeZone SMALLINT NOT NULL, + ClientEventTime TIMESTAMP NOT NULL, + SilverlightVersion1 SMALLINT NOT NULL, + SilverlightVersion2 SMALLINT NOT NULL, + SilverlightVersion3 INTEGER NOT NULL, + SilverlightVersion4 SMALLINT NOT NULL, + PageCharset TEXT NOT NULL, + CodeVersion INTEGER NOT NULL, + IsLink SMALLINT NOT NULL, + IsDownload SMALLINT NOT NULL, + IsNotBounce SMALLINT NOT NULL, + FUniqID BIGINT NOT NULL, + OriginalURL TEXT NOT NULL, + HID INTEGER NOT NULL, + IsOldCounter SMALLINT NOT NULL, + IsEvent SMALLINT NOT NULL, + IsParameter SMALLINT NOT NULL, + DontCountHits SMALLINT NOT NULL, + WithHash SMALLINT NOT NULL, + HitColor CHAR NOT NULL, + LocalEventTime TIMESTAMP NOT NULL, + Age SMALLINT NOT NULL, + Sex SMALLINT NOT NULL, + Income SMALLINT NOT NULL, + Interests SMALLINT NOT NULL, + Robotness SMALLINT NOT NULL, + RemoteIP INTEGER NOT NULL, + WindowName INTEGER NOT NULL, + OpenerName INTEGER NOT NULL, + HistoryLength SMALLINT NOT NULL, + BrowserLanguage TEXT NOT NULL, + BrowserCountry TEXT NOT NULL, + SocialNetwork TEXT NOT NULL, + SocialAction TEXT NOT NULL, + HTTPError SMALLINT NOT NULL, + SendTiming INTEGER NOT NULL, + DNSTiming INTEGER NOT NULL, + ConnectTiming INTEGER NOT NULL, + ResponseStartTiming INTEGER NOT NULL, + ResponseEndTiming INTEGER NOT NULL, + FetchTiming INTEGER NOT NULL, + SocialSourceNetworkID SMALLINT NOT NULL, + SocialSourcePage TEXT NOT NULL, + ParamPrice BIGINT NOT NULL, + ParamOrderID TEXT NOT NULL, + ParamCurrency TEXT NOT NULL, + ParamCurrencyID SMALLINT NOT NULL, + OpenstatServiceName TEXT NOT NULL, + OpenstatCampaignID TEXT NOT NULL, + OpenstatAdID TEXT NOT NULL, + OpenstatSourceID TEXT NOT NULL, + UTMSource TEXT NOT NULL, + UTMMedium TEXT NOT NULL, + UTMCampaign TEXT NOT NULL, + UTMContent TEXT NOT NULL, + UTMTerm TEXT NOT NULL, + FromTag TEXT NOT NULL, + HasGCLID SMALLINT NOT NULL, + RefererHash BIGINT NOT NULL, + URLHash BIGINT NOT NULL, + CLID INTEGER NOT NULL, + PRIMARY KEY (CounterID, EventDate, UserID, EventTime, WatchID) +) +ENGINE = MergeTree +SETTINGS disk = disk(type = cache, path = '/dev/shm/clickhouse/', max_size = '16G', + disk = disk(type = web, endpoint = 'https://clickhouse-datasets-web.s3.us-east-1.amazonaws.com/')); diff --git a/docker/test/clickbench/queries.sql b/docker/test/clickbench/queries.sql new file mode 100644 index 00000000000..31f65fc898d --- /dev/null +++ b/docker/test/clickbench/queries.sql @@ -0,0 +1,43 @@ +SELECT COUNT(*) FROM hits; +SELECT COUNT(*) FROM hits WHERE AdvEngineID <> 0; +SELECT SUM(AdvEngineID), COUNT(*), AVG(ResolutionWidth) FROM hits; +SELECT AVG(UserID) FROM hits; +SELECT COUNT(DISTINCT UserID) FROM hits; +SELECT COUNT(DISTINCT SearchPhrase) FROM hits; +SELECT MIN(EventDate), MAX(EventDate) FROM hits; +SELECT AdvEngineID, COUNT(*) FROM hits WHERE AdvEngineID <> 0 GROUP BY AdvEngineID ORDER BY COUNT(*) DESC; +SELECT RegionID, COUNT(DISTINCT UserID) AS u FROM hits GROUP BY RegionID ORDER BY u DESC LIMIT 10; +SELECT RegionID, SUM(AdvEngineID), COUNT(*) AS c, AVG(ResolutionWidth), COUNT(DISTINCT UserID) FROM hits GROUP BY RegionID ORDER BY c DESC LIMIT 10; +SELECT MobilePhoneModel, COUNT(DISTINCT UserID) AS u FROM hits WHERE MobilePhoneModel <> '' GROUP BY MobilePhoneModel ORDER BY u DESC 
LIMIT 10; +SELECT MobilePhone, MobilePhoneModel, COUNT(DISTINCT UserID) AS u FROM hits WHERE MobilePhoneModel <> '' GROUP BY MobilePhone, MobilePhoneModel ORDER BY u DESC LIMIT 10; +SELECT SearchPhrase, COUNT(*) AS c FROM hits WHERE SearchPhrase <> '' GROUP BY SearchPhrase ORDER BY c DESC LIMIT 10; +SELECT SearchPhrase, COUNT(DISTINCT UserID) AS u FROM hits WHERE SearchPhrase <> '' GROUP BY SearchPhrase ORDER BY u DESC LIMIT 10; +SELECT SearchEngineID, SearchPhrase, COUNT(*) AS c FROM hits WHERE SearchPhrase <> '' GROUP BY SearchEngineID, SearchPhrase ORDER BY c DESC LIMIT 10; +SELECT UserID, COUNT(*) FROM hits GROUP BY UserID ORDER BY COUNT(*) DESC LIMIT 10; +SELECT UserID, SearchPhrase, COUNT(*) FROM hits GROUP BY UserID, SearchPhrase ORDER BY COUNT(*) DESC LIMIT 10; +SELECT UserID, SearchPhrase, COUNT(*) FROM hits GROUP BY UserID, SearchPhrase LIMIT 10; +SELECT UserID, extract(minute FROM EventTime) AS m, SearchPhrase, COUNT(*) FROM hits GROUP BY UserID, m, SearchPhrase ORDER BY COUNT(*) DESC LIMIT 10; +SELECT UserID FROM hits WHERE UserID = 435090932899640449; +SELECT COUNT(*) FROM hits WHERE URL LIKE '%google%'; +SELECT SearchPhrase, MIN(URL), COUNT(*) AS c FROM hits WHERE URL LIKE '%google%' AND SearchPhrase <> '' GROUP BY SearchPhrase ORDER BY c DESC LIMIT 10; +SELECT SearchPhrase, MIN(URL), MIN(Title), COUNT(*) AS c, COUNT(DISTINCT UserID) FROM hits WHERE Title LIKE '%Google%' AND URL NOT LIKE '%.google.%' AND SearchPhrase <> '' GROUP BY SearchPhrase ORDER BY c DESC LIMIT 10; +SELECT * FROM hits WHERE URL LIKE '%google%' ORDER BY EventTime LIMIT 10; +SELECT SearchPhrase FROM hits WHERE SearchPhrase <> '' ORDER BY EventTime LIMIT 10; +SELECT SearchPhrase FROM hits WHERE SearchPhrase <> '' ORDER BY SearchPhrase LIMIT 10; +SELECT SearchPhrase FROM hits WHERE SearchPhrase <> '' ORDER BY EventTime, SearchPhrase LIMIT 10; +SELECT CounterID, AVG(length(URL)) AS l, COUNT(*) AS c FROM hits WHERE URL <> '' GROUP BY CounterID HAVING COUNT(*) > 100000 ORDER BY l DESC LIMIT 25; +SELECT REGEXP_REPLACE(Referer, '^https?://(?:www\.)?([^/]+)/.*$', '\1') AS k, AVG(length(Referer)) AS l, COUNT(*) AS c, MIN(Referer) FROM hits WHERE Referer <> '' GROUP BY k HAVING COUNT(*) > 100000 ORDER BY l DESC LIMIT 25; +SELECT SUM(ResolutionWidth), SUM(ResolutionWidth + 1), SUM(ResolutionWidth + 2), SUM(ResolutionWidth + 3), SUM(ResolutionWidth + 4), SUM(ResolutionWidth + 5), SUM(ResolutionWidth + 6), SUM(ResolutionWidth + 7), SUM(ResolutionWidth + 8), SUM(ResolutionWidth + 9), SUM(ResolutionWidth + 10), SUM(ResolutionWidth + 11), SUM(ResolutionWidth + 12), SUM(ResolutionWidth + 13), SUM(ResolutionWidth + 14), SUM(ResolutionWidth + 15), SUM(ResolutionWidth + 16), SUM(ResolutionWidth + 17), SUM(ResolutionWidth + 18), SUM(ResolutionWidth + 19), SUM(ResolutionWidth + 20), SUM(ResolutionWidth + 21), SUM(ResolutionWidth + 22), SUM(ResolutionWidth + 23), SUM(ResolutionWidth + 24), SUM(ResolutionWidth + 25), SUM(ResolutionWidth + 26), SUM(ResolutionWidth + 27), SUM(ResolutionWidth + 28), SUM(ResolutionWidth + 29), SUM(ResolutionWidth + 30), SUM(ResolutionWidth + 31), SUM(ResolutionWidth + 32), SUM(ResolutionWidth + 33), SUM(ResolutionWidth + 34), SUM(ResolutionWidth + 35), SUM(ResolutionWidth + 36), SUM(ResolutionWidth + 37), SUM(ResolutionWidth + 38), SUM(ResolutionWidth + 39), SUM(ResolutionWidth + 40), SUM(ResolutionWidth + 41), SUM(ResolutionWidth + 42), SUM(ResolutionWidth + 43), SUM(ResolutionWidth + 44), SUM(ResolutionWidth + 45), SUM(ResolutionWidth + 46), SUM(ResolutionWidth + 47), SUM(ResolutionWidth + 48), 
SUM(ResolutionWidth + 49), SUM(ResolutionWidth + 50), SUM(ResolutionWidth + 51), SUM(ResolutionWidth + 52), SUM(ResolutionWidth + 53), SUM(ResolutionWidth + 54), SUM(ResolutionWidth + 55), SUM(ResolutionWidth + 56), SUM(ResolutionWidth + 57), SUM(ResolutionWidth + 58), SUM(ResolutionWidth + 59), SUM(ResolutionWidth + 60), SUM(ResolutionWidth + 61), SUM(ResolutionWidth + 62), SUM(ResolutionWidth + 63), SUM(ResolutionWidth + 64), SUM(ResolutionWidth + 65), SUM(ResolutionWidth + 66), SUM(ResolutionWidth + 67), SUM(ResolutionWidth + 68), SUM(ResolutionWidth + 69), SUM(ResolutionWidth + 70), SUM(ResolutionWidth + 71), SUM(ResolutionWidth + 72), SUM(ResolutionWidth + 73), SUM(ResolutionWidth + 74), SUM(ResolutionWidth + 75), SUM(ResolutionWidth + 76), SUM(ResolutionWidth + 77), SUM(ResolutionWidth + 78), SUM(ResolutionWidth + 79), SUM(ResolutionWidth + 80), SUM(ResolutionWidth + 81), SUM(ResolutionWidth + 82), SUM(ResolutionWidth + 83), SUM(ResolutionWidth + 84), SUM(ResolutionWidth + 85), SUM(ResolutionWidth + 86), SUM(ResolutionWidth + 87), SUM(ResolutionWidth + 88), SUM(ResolutionWidth + 89) FROM hits; +SELECT SearchEngineID, ClientIP, COUNT(*) AS c, SUM(IsRefresh), AVG(ResolutionWidth) FROM hits WHERE SearchPhrase <> '' GROUP BY SearchEngineID, ClientIP ORDER BY c DESC LIMIT 10; +SELECT WatchID, ClientIP, COUNT(*) AS c, SUM(IsRefresh), AVG(ResolutionWidth) FROM hits WHERE SearchPhrase <> '' GROUP BY WatchID, ClientIP ORDER BY c DESC LIMIT 10; +SELECT WatchID, ClientIP, COUNT(*) AS c, SUM(IsRefresh), AVG(ResolutionWidth) FROM hits GROUP BY WatchID, ClientIP ORDER BY c DESC LIMIT 10; +SELECT URL, COUNT(*) AS c FROM hits GROUP BY URL ORDER BY c DESC LIMIT 10; +SELECT 1, URL, COUNT(*) AS c FROM hits GROUP BY 1, URL ORDER BY c DESC LIMIT 10; +SELECT ClientIP, ClientIP - 1, ClientIP - 2, ClientIP - 3, COUNT(*) AS c FROM hits GROUP BY ClientIP, ClientIP - 1, ClientIP - 2, ClientIP - 3 ORDER BY c DESC LIMIT 10; +SELECT URL, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND DontCountHits = 0 AND IsRefresh = 0 AND URL <> '' GROUP BY URL ORDER BY PageViews DESC LIMIT 10; +SELECT Title, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND DontCountHits = 0 AND IsRefresh = 0 AND Title <> '' GROUP BY Title ORDER BY PageViews DESC LIMIT 10; +SELECT URL, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND IsRefresh = 0 AND IsLink <> 0 AND IsDownload = 0 GROUP BY URL ORDER BY PageViews DESC LIMIT 10 OFFSET 1000; +SELECT TraficSourceID, SearchEngineID, AdvEngineID, CASE WHEN (SearchEngineID = 0 AND AdvEngineID = 0) THEN Referer ELSE '' END AS Src, URL AS Dst, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND IsRefresh = 0 GROUP BY TraficSourceID, SearchEngineID, AdvEngineID, Src, Dst ORDER BY PageViews DESC LIMIT 10 OFFSET 1000; +SELECT URLHash, EventDate, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND IsRefresh = 0 AND TraficSourceID IN (-1, 6) AND RefererHash = 3594120000172545465 GROUP BY URLHash, EventDate ORDER BY PageViews DESC LIMIT 10 OFFSET 100; +SELECT WindowClientWidth, WindowClientHeight, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-01' AND EventDate <= '2013-07-31' AND IsRefresh = 0 AND DontCountHits = 0 AND URLHash = 
2868770270353813622 GROUP BY WindowClientWidth, WindowClientHeight ORDER BY PageViews DESC LIMIT 10 OFFSET 10000; +SELECT DATE_TRUNC('minute', EventTime) AS M, COUNT(*) AS PageViews FROM hits WHERE CounterID = 62 AND EventDate >= '2013-07-14' AND EventDate <= '2013-07-15' AND IsRefresh = 0 AND DontCountHits = 0 GROUP BY DATE_TRUNC('minute', EventTime) ORDER BY DATE_TRUNC('minute', EventTime) LIMIT 10 OFFSET 1000; diff --git a/docker/test/clickbench/run.sh b/docker/test/clickbench/run.sh new file mode 100755 index 00000000000..3d27a40bb74 --- /dev/null +++ b/docker/test/clickbench/run.sh @@ -0,0 +1,79 @@ +#!/bin/bash + +SCRIPT_PID=$! +(sleep 1200 && kill -9 $SCRIPT_PID) & + +# shellcheck disable=SC1091 +source /setup_export_logs.sh + +# fail on errors, verbose and export all env variables +set -e -x -a + +dpkg -i package_folder/clickhouse-common-static_*.deb +dpkg -i package_folder/clickhouse-server_*.deb +dpkg -i package_folder/clickhouse-client_*.deb + +# A directory for cache +mkdir /dev/shm/clickhouse +chown clickhouse:clickhouse /dev/shm/clickhouse + +# Allow introspection functions, needed for sending the logs +echo " +profiles: + default: + allow_introspection_functions: 1 +" > /etc/clickhouse-server/users.d/allow_introspection_functions.yaml + +# Enable text_log +echo " +text_log: +" > /etc/clickhouse-server/config.d/text_log.yaml + +config_logs_export_cluster /etc/clickhouse-server/config.d/system_logs_export.yaml + +clickhouse start + +# Wait for the server to start, but not for too long. +for _ in {1..100} +do + clickhouse-client --query "SELECT 1" && break + sleep 1 +done + +setup_logs_replication + +# Load the data + +clickhouse-client --time < /create.sql + +# Run the queries + +set +x + +TRIES=3 +QUERY_NUM=1 +while read -r query; do + echo -n "[" + for i in $(seq 1 $TRIES); do + RES=$(clickhouse-client --query_id "q${QUERY_NUM}-${i}" --time --format Null --query "$query" --progress 0 2>&1 ||:) + echo -n "${RES}" + [[ "$i" != "$TRIES" ]] && echo -n ", " + + echo "${QUERY_NUM},${i},${RES}" >> /test_output/test_results.tsv + done + echo "]," + + QUERY_NUM=$((QUERY_NUM + 1)) +done < /queries.sql + +set -x + +clickhouse-client --query "SELECT total_bytes FROM system.tables WHERE name = 'hits' AND database = 'default'" + +clickhouse-client -q "system flush logs" ||: +stop_logs_replication +clickhouse stop + +mv /var/log/clickhouse-server/* /test_output/ + +echo -e "success\tClickBench finished" > /test_output/check_status.tsv diff --git a/docker/test/fasttest/run.sh b/docker/test/fasttest/run.sh index d3695ba2613..5af05034415 100755 --- a/docker/test/fasttest/run.sh +++ b/docker/test/fasttest/run.sh @@ -16,7 +16,7 @@ export LLVM_VERSION=${LLVM_VERSION:-17} # it being undefined. Also read it as array so that we can pass an empty list # of additional variable to cmake properly, and it doesn't generate an extra # empty parameter. -# Read it as CMAKE_FLAGS to not lose exported FASTTEST_CMAKE_FLAGS on subsequential launch +# Read it as CMAKE_FLAGS to not lose exported FASTTEST_CMAKE_FLAGS on subsequent launch read -ra CMAKE_FLAGS <<< "${FASTTEST_CMAKE_FLAGS:-}" # Run only matching tests. 
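A note on the watchdog at the top of the ClickBench run.sh above: $! expands to the PID of the most recently started background job, so before any job has been launched it is empty; the PID a script normally hands to such a self-destruct timer is its own, $$. A minimal standalone version of the pattern, assuming the same 20-minute budget:

#!/bin/bash
# Watchdog sketch: abort the whole run if it exceeds a hard time budget.
# $$ is this script's own PID; $! is only set after a background job has been launched.
TIME_BUDGET_SECONDS=1200   # assumption: same budget as the ClickBench script

(sleep "$TIME_BUDGET_SECONDS" && echo "Time budget exceeded, aborting" >&2 && kill -9 $$) &
WATCHDOG_PID=$!

# ... the actual benchmark work goes here ...
sleep 5

# Disarm the watchdog once the work finished within the budget.
kill "$WATCHDOG_PID" 2>/dev/null || true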
@@ -197,7 +197,7 @@ function run_cmake ( cd "$FASTTEST_BUILD" - cmake "$FASTTEST_SOURCE" -DCMAKE_CXX_COMPILER="clang++-${LLVM_VERSION}" -DCMAKE_C_COMPILER="clang-${LLVM_VERSION}" "${CMAKE_LIBS_CONFIG[@]}" "${CMAKE_FLAGS[@]}" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee "$FASTTEST_OUTPUT/cmake_log.txt" + cmake "$FASTTEST_SOURCE" -DCMAKE_CXX_COMPILER="clang++-${LLVM_VERSION}" -DCMAKE_C_COMPILER="clang-${LLVM_VERSION}" -DCMAKE_TOOLCHAIN_FILE="${FASTTEST_SOURCE}/cmake/linux/toolchain-x86_64-musl.cmake" "${CMAKE_LIBS_CONFIG[@]}" "${CMAKE_FLAGS[@]}" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee "$FASTTEST_OUTPUT/cmake_log.txt" ) } diff --git a/docker/test/integration/helper_container/Dockerfile b/docker/test/integration/helper_container/Dockerfile index 60adaea1796..49a3d3cd84b 100644 --- a/docker/test/integration/helper_container/Dockerfile +++ b/docker/test/integration/helper_container/Dockerfile @@ -1,7 +1,7 @@ # docker build -t clickhouse/integration-helper . # Helper docker container to run iptables without sudo -FROM alpine +FROM alpine:3.18 RUN apk add --no-cache -U iproute2 \ && for bin in iptables iptables-restore iptables-save; \ do ln -sf xtables-nft-multi "/sbin/$bin"; \ diff --git a/docker/test/integration/runner/Dockerfile b/docker/test/integration/runner/Dockerfile index 458ca2b1da8..c795fbf0672 100644 --- a/docker/test/integration/runner/Dockerfile +++ b/docker/test/integration/runner/Dockerfile @@ -74,7 +74,7 @@ RUN python3 -m pip install --no-cache-dir \ delta-spark==2.3.0 \ dict2xml \ dicttoxml \ - docker \ + docker==6.1.3 \ docker-compose==1.29.2 \ grpcio \ grpcio-tools \ diff --git a/docker/test/integration/runner/compose/docker_compose_minio.yml b/docker/test/integration/runner/compose/docker_compose_minio.yml index 45e55e7a79c..4255a529f6d 100644 --- a/docker/test/integration/runner/compose/docker_compose_minio.yml +++ b/docker/test/integration/runner/compose/docker_compose_minio.yml @@ -34,7 +34,7 @@ services: # Empty container to run proxy resolver. resolver: - image: clickhouse/python-bottle + image: clickhouse/python-bottle:${DOCKER_PYTHON_BOTTLE_TAG:-latest} expose: - "8080" tty: true diff --git a/docker/test/performance-comparison/Dockerfile b/docker/test/performance-comparison/Dockerfile index d31663f9071..e4ced104445 100644 --- a/docker/test/performance-comparison/Dockerfile +++ b/docker/test/performance-comparison/Dockerfile @@ -39,18 +39,8 @@ RUN apt-get update \ && apt-get clean \ && rm -rf /var/lib/apt/lists/* -COPY * / +COPY run.sh / -# Bind everything to one NUMA node, if there's more than one. Theoretically the -# node #0 should be less stable because of system interruptions. We bind -# randomly to node 1 or 0 to gather some statistics on that. We have to bind -# both servers and the tmpfs on which the database is stored. How to do it -# is unclear, but by default tmpfs uses -# 'process allocation policy', not sure which process but hopefully the one that -# writes to it, so just bind the downloader script as well. -# https://www.kernel.org/doc/Documentation/filesystems/tmpfs.txt -# Double-escaped backslashes are a tribute to the engineering wonder of docker -- -# it gives '/bin/sh: 1: [bash,: not found' otherwise. 
-CMD ["bash", "-c", "node=$((RANDOM % $(numactl --hardware | sed -n 's/^.*available:\\(.*\\)nodes.*$/\\1/p'))); echo Will bind to NUMA node $node; numactl --cpunodebind=$node --membind=$node /entrypoint.sh"] +CMD ["bash", "/run.sh"] # docker run --network=host --volume :/workspace --volume=:/output -e PR_TO_TEST=<> -e SHA_TO_TEST=<> clickhouse/performance-comparison diff --git a/docker/test/performance-comparison/run.sh b/docker/test/performance-comparison/run.sh new file mode 100644 index 00000000000..7afb5da59b1 --- /dev/null +++ b/docker/test/performance-comparison/run.sh @@ -0,0 +1,18 @@ +#!/bin/bash + +entry="/usr/share/clickhouse-test/performance/scripts/entrypoint.sh" +[ ! -e "$entry" ] && echo "ERROR: test scripts are not found" && exit 1 + +# Bind everything to one NUMA node, if there's more than one. Theoretically the +# node #0 should be less stable because of system interruptions. We bind +# randomly to node 1 or 0 to gather some statistics on that. We have to bind +# both servers and the tmpfs on which the database is stored. How to do it +# is unclear, but by default tmpfs uses +# 'process allocation policy', not sure which process but hopefully the one that +# writes to it, so just bind the downloader script as well. +# https://www.kernel.org/doc/Documentation/filesystems/tmpfs.txt +# Double-escaped backslashes are a tribute to the engineering wonder of docker -- +# it gives '/bin/sh: 1: [bash,: not found' otherwise. +node=$(( RANDOM % $(numactl --hardware | sed -n 's/^.*available:\(.*\)nodes.*$/\1/p') )); +echo Will bind to NUMA node $node; +numactl --cpunodebind=$node --membind=$node $entry diff --git a/docker/test/sqllogic/Dockerfile b/docker/test/sqllogic/Dockerfile index 5cf71e4d3f8..48457a99de3 100644 --- a/docker/test/sqllogic/Dockerfile +++ b/docker/test/sqllogic/Dockerfile @@ -20,7 +20,8 @@ RUN apt-get update --yes \ RUN pip3 install \ numpy \ pyodbc \ - deepdiff + deepdiff \ + sqlglot ARG odbc_repo="https://github.com/ClickHouse/clickhouse-odbc.git" @@ -35,7 +36,7 @@ RUN git clone --recursive ${odbc_repo} \ && odbcinst -i -s -l -f /clickhouse-odbc/packaging/odbc.ini.sample ENV TZ=Europe/Amsterdam -ENV MAX_RUN_TIME=900 +ENV MAX_RUN_TIME=9000 RUN ln -snf /usr/share/zoneinfo/$TZ /etc/localtime && echo $TZ > /etc/timezone ARG sqllogic_test_repo="https://github.com/gregrahn/sqllogictest.git" diff --git a/docker/test/sqllogic/run.sh b/docker/test/sqllogic/run.sh index db828741b0d..ccba344035e 100755 --- a/docker/test/sqllogic/run.sh +++ b/docker/test/sqllogic/run.sh @@ -75,6 +75,20 @@ function run_tests() cat /test_output/statements-test/check_status.tsv >> /test_output/check_status.tsv cat /test_output/statements-test/test_results.tsv >> /test_output/test_results.tsv tar -zcvf statements-check.tar.gz statements-test 1>/dev/null + + mkdir -p /test_output/complete-test + /clickhouse-tests/sqllogic/runner.py \ + --log-file /test_output/runner-complete-test.log \ + --log-level info \ + complete-test \ + --input-dir /sqllogictest \ + --out-dir /test_output/complete-test \ + 2>&1 \ + | ts '%Y-%m-%d %H:%M:%S' + + cat /test_output/complete-test/check_status.tsv >> /test_output/check_status.tsv + cat /test_output/complete-test/test_results.tsv >> /test_output/test_results.tsv + tar -zcvf complete-check.tar.gz complete-test 1>/dev/null fi } diff --git a/docker/test/stateful/run.sh b/docker/test/stateful/run.sh index ad3c3477b37..c9ce5697182 100755 --- a/docker/test/stateful/run.sh +++ b/docker/test/stateful/run.sh @@ -24,6 +24,28 @@ azurite-blob --blobHost 0.0.0.0 --blobPort 
10000 --debug /azurite_log & config_logs_export_cluster /etc/clickhouse-server/config.d/system_logs_export.yaml +cache_policy="" +if [ $(( $(date +%-d) % 2 )) -eq 1 ]; then + cache_policy="SLRU" +else + cache_policy="LRU" +fi + +echo "Using cache policy: $cache_policy" + +if [ "$cache_policy" = "SLRU" ]; then + sudo cat /etc/clickhouse-server/config.d/storage_conf.xml \ + | sed "s|LRU|SLRU|" \ + > /etc/clickhouse-server/config.d/storage_conf.xml.tmp + mv /etc/clickhouse-server/config.d/storage_conf.xml.tmp /etc/clickhouse-server/config.d/storage_conf.xml +fi + +if [[ -n "$USE_S3_STORAGE_FOR_MERGE_TREE" ]] && [[ "$USE_S3_STORAGE_FOR_MERGE_TREE" -eq 1 ]]; then + # It is not needed, we will explicitly create tables on s3. + # We do not have statefull tests with s3 storage run in public repository, but this is needed for another repository. + rm /etc/clickhouse-server/config.d/s3_storage_policy_for_merge_tree_by_default.xml +fi + function start() { if [[ -n "$USE_DATABASE_REPLICATED" ]] && [[ "$USE_DATABASE_REPLICATED" -eq 1 ]]; then @@ -107,8 +129,76 @@ if [[ -n "$USE_DATABASE_REPLICATED" ]] && [[ "$USE_DATABASE_REPLICATED" -eq 1 ]] else clickhouse-client --query "CREATE DATABASE test" clickhouse-client --query "SHOW TABLES FROM test" - clickhouse-client --query "RENAME TABLE datasets.hits_v1 TO test.hits" - clickhouse-client --query "RENAME TABLE datasets.visits_v1 TO test.visits" + if [[ -n "$USE_S3_STORAGE_FOR_MERGE_TREE" ]] && [[ "$USE_S3_STORAGE_FOR_MERGE_TREE" -eq 1 ]]; then + clickhouse-client --query "CREATE TABLE test.hits (WatchID UInt64, JavaEnable UInt8, Title String, GoodEvent Int16, + EventTime DateTime, EventDate Date, CounterID UInt32, ClientIP UInt32, ClientIP6 FixedString(16), RegionID UInt32, + UserID UInt64, CounterClass Int8, OS UInt8, UserAgent UInt8, URL String, Referer String, URLDomain String, + RefererDomain String, Refresh UInt8, IsRobot UInt8, RefererCategories Array(UInt16), URLCategories Array(UInt16), + URLRegions Array(UInt32), RefererRegions Array(UInt32), ResolutionWidth UInt16, ResolutionHeight UInt16, ResolutionDepth UInt8, + FlashMajor UInt8, FlashMinor UInt8, FlashMinor2 String, NetMajor UInt8, NetMinor UInt8, UserAgentMajor UInt16, + UserAgentMinor FixedString(2), CookieEnable UInt8, JavascriptEnable UInt8, IsMobile UInt8, MobilePhone UInt8, + MobilePhoneModel String, Params String, IPNetworkID UInt32, TraficSourceID Int8, SearchEngineID UInt16, + SearchPhrase String, AdvEngineID UInt8, IsArtifical UInt8, WindowClientWidth UInt16, WindowClientHeight UInt16, + ClientTimeZone Int16, ClientEventTime DateTime, SilverlightVersion1 UInt8, SilverlightVersion2 UInt8, SilverlightVersion3 UInt32, + SilverlightVersion4 UInt16, PageCharset String, CodeVersion UInt32, IsLink UInt8, IsDownload UInt8, IsNotBounce UInt8, + FUniqID UInt64, HID UInt32, IsOldCounter UInt8, IsEvent UInt8, IsParameter UInt8, DontCountHits UInt8, WithHash UInt8, + HitColor FixedString(1), UTCEventTime DateTime, Age UInt8, Sex UInt8, Income UInt8, Interests UInt16, Robotness UInt8, + GeneralInterests Array(UInt16), RemoteIP UInt32, RemoteIP6 FixedString(16), WindowName Int32, OpenerName Int32, + HistoryLength Int16, BrowserLanguage FixedString(2), BrowserCountry FixedString(2), SocialNetwork String, SocialAction String, + HTTPError UInt16, SendTiming Int32, DNSTiming Int32, ConnectTiming Int32, ResponseStartTiming Int32, ResponseEndTiming Int32, + FetchTiming Int32, RedirectTiming Int32, DOMInteractiveTiming Int32, DOMContentLoadedTiming Int32, DOMCompleteTiming Int32, + LoadEventStartTiming 
Int32, LoadEventEndTiming Int32, NSToDOMContentLoadedTiming Int32, FirstPaintTiming Int32, + RedirectCount Int8, SocialSourceNetworkID UInt8, SocialSourcePage String, ParamPrice Int64, ParamOrderID String, + ParamCurrency FixedString(3), ParamCurrencyID UInt16, GoalsReached Array(UInt32), OpenstatServiceName String, + OpenstatCampaignID String, OpenstatAdID String, OpenstatSourceID String, UTMSource String, UTMMedium String, + UTMCampaign String, UTMContent String, UTMTerm String, FromTag String, HasGCLID UInt8, RefererHash UInt64, + URLHash UInt64, CLID UInt32, YCLID UInt64, ShareService String, ShareURL String, ShareTitle String, + ParsedParams Nested(Key1 String, Key2 String, Key3 String, Key4 String, Key5 String, ValueDouble Float64), + IslandID FixedString(16), RequestNum UInt32, RequestTry UInt8) ENGINE = MergeTree() PARTITION BY toYYYYMM(EventDate) + ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity = 8192, storage_policy='s3_cache'" + clickhouse-client --query "CREATE TABLE test.visits (CounterID UInt32, StartDate Date, Sign Int8, IsNew UInt8, + VisitID UInt64, UserID UInt64, StartTime DateTime, Duration UInt32, UTCStartTime DateTime, PageViews Int32, + Hits Int32, IsBounce UInt8, Referer String, StartURL String, RefererDomain String, StartURLDomain String, + EndURL String, LinkURL String, IsDownload UInt8, TraficSourceID Int8, SearchEngineID UInt16, SearchPhrase String, + AdvEngineID UInt8, PlaceID Int32, RefererCategories Array(UInt16), URLCategories Array(UInt16), URLRegions Array(UInt32), + RefererRegions Array(UInt32), IsYandex UInt8, GoalReachesDepth Int32, GoalReachesURL Int32, GoalReachesAny Int32, + SocialSourceNetworkID UInt8, SocialSourcePage String, MobilePhoneModel String, ClientEventTime DateTime, RegionID UInt32, + ClientIP UInt32, ClientIP6 FixedString(16), RemoteIP UInt32, RemoteIP6 FixedString(16), IPNetworkID UInt32, + SilverlightVersion3 UInt32, CodeVersion UInt32, ResolutionWidth UInt16, ResolutionHeight UInt16, UserAgentMajor UInt16, + UserAgentMinor UInt16, WindowClientWidth UInt16, WindowClientHeight UInt16, SilverlightVersion2 UInt8, SilverlightVersion4 UInt16, + FlashVersion3 UInt16, FlashVersion4 UInt16, ClientTimeZone Int16, OS UInt8, UserAgent UInt8, ResolutionDepth UInt8, + FlashMajor UInt8, FlashMinor UInt8, NetMajor UInt8, NetMinor UInt8, MobilePhone UInt8, SilverlightVersion1 UInt8, + Age UInt8, Sex UInt8, Income UInt8, JavaEnable UInt8, CookieEnable UInt8, JavascriptEnable UInt8, IsMobile UInt8, + BrowserLanguage UInt16, BrowserCountry UInt16, Interests UInt16, Robotness UInt8, GeneralInterests Array(UInt16), + Params Array(String), Goals Nested(ID UInt32, Serial UInt32, EventTime DateTime, Price Int64, OrderID String, CurrencyID UInt32), + WatchIDs Array(UInt64), ParamSumPrice Int64, ParamCurrency FixedString(3), ParamCurrencyID UInt16, ClickLogID UInt64, + ClickEventID Int32, ClickGoodEvent Int32, ClickEventTime DateTime, ClickPriorityID Int32, ClickPhraseID Int32, ClickPageID Int32, + ClickPlaceID Int32, ClickTypeID Int32, ClickResourceID Int32, ClickCost UInt32, ClickClientIP UInt32, ClickDomainID UInt32, + ClickURL String, ClickAttempt UInt8, ClickOrderID UInt32, ClickBannerID UInt32, ClickMarketCategoryID UInt32, ClickMarketPP UInt32, + ClickMarketCategoryName String, ClickMarketPPName String, ClickAWAPSCampaignName String, ClickPageName String, ClickTargetType UInt16, + ClickTargetPhraseID UInt64, ClickContextType UInt8, ClickSelectType Int8, ClickOptions String, ClickGroupBannerID 
Int32, + OpenstatServiceName String, OpenstatCampaignID String, OpenstatAdID String, OpenstatSourceID String, UTMSource String, + UTMMedium String, UTMCampaign String, UTMContent String, UTMTerm String, FromTag String, HasGCLID UInt8, FirstVisit DateTime, + PredLastVisit Date, LastVisit Date, TotalVisits UInt32, TraficSource Nested(ID Int8, SearchEngineID UInt16, AdvEngineID UInt8, + PlaceID UInt16, SocialSourceNetworkID UInt8, Domain String, SearchPhrase String, SocialSourcePage String), Attendance FixedString(16), + CLID UInt32, YCLID UInt64, NormalizedRefererHash UInt64, SearchPhraseHash UInt64, RefererDomainHash UInt64, NormalizedStartURLHash UInt64, + StartURLDomainHash UInt64, NormalizedEndURLHash UInt64, TopLevelDomain UInt64, URLScheme UInt64, OpenstatServiceNameHash UInt64, + OpenstatCampaignIDHash UInt64, OpenstatAdIDHash UInt64, OpenstatSourceIDHash UInt64, UTMSourceHash UInt64, UTMMediumHash UInt64, + UTMCampaignHash UInt64, UTMContentHash UInt64, UTMTermHash UInt64, FromHash UInt64, WebVisorEnabled UInt8, WebVisorActivity UInt32, + ParsedParams Nested(Key1 String, Key2 String, Key3 String, Key4 String, Key5 String, ValueDouble Float64), + Market Nested(Type UInt8, GoalID UInt32, OrderID String, OrderPrice Int64, PP UInt32, DirectPlaceID UInt32, DirectOrderID UInt32, + DirectBannerID UInt32, GoodID String, GoodName String, GoodQuantity Int32, GoodPrice Int64), IslandID FixedString(16)) + ENGINE = CollapsingMergeTree(Sign) PARTITION BY toYYYYMM(StartDate) ORDER BY (CounterID, StartDate, intHash32(UserID), VisitID) + SAMPLE BY intHash32(UserID) SETTINGS index_granularity = 8192, storage_policy='s3_cache'" + + clickhouse-client --query "INSERT INTO test.hits SELECT * FROM datasets.hits_v1 SETTINGS enable_filesystem_cache_on_write_operations=0" + clickhouse-client --query "INSERT INTO test.visits SELECT * FROM datasets.visits_v1 SETTINGS enable_filesystem_cache_on_write_operations=0" + clickhouse-client --query "DROP TABLE datasets.visits_v1 SYNC" + clickhouse-client --query "DROP TABLE datasets.hits_v1 SYNC" + else + clickhouse-client --query "RENAME TABLE datasets.hits_v1 TO test.hits" + clickhouse-client --query "RENAME TABLE datasets.visits_v1 TO test.visits" + fi clickhouse-client --query "CREATE TABLE test.hits_s3 (WatchID UInt64, JavaEnable UInt8, Title String, GoodEvent Int16, EventTime DateTime, EventDate Date, CounterID UInt32, ClientIP UInt32, ClientIP6 FixedString(16), RegionID UInt32, UserID UInt64, CounterClass Int8, OS UInt8, UserAgent UInt8, URL String, Referer String, URLDomain String, RefererDomain String, Refresh UInt8, IsRobot UInt8, RefererCategories Array(UInt16), URLCategories Array(UInt16), URLRegions Array(UInt32), RefererRegions Array(UInt32), ResolutionWidth UInt16, ResolutionHeight UInt16, ResolutionDepth UInt8, FlashMajor UInt8, FlashMinor UInt8, FlashMinor2 String, NetMajor UInt8, NetMinor UInt8, UserAgentMajor UInt16, UserAgentMinor FixedString(2), CookieEnable UInt8, JavascriptEnable UInt8, IsMobile UInt8, MobilePhone UInt8, MobilePhoneModel String, Params String, IPNetworkID UInt32, TraficSourceID Int8, SearchEngineID UInt16, SearchPhrase String, AdvEngineID UInt8, IsArtifical UInt8, WindowClientWidth UInt16, WindowClientHeight UInt16, ClientTimeZone Int16, ClientEventTime DateTime, SilverlightVersion1 UInt8, SilverlightVersion2 UInt8, SilverlightVersion3 UInt32, SilverlightVersion4 UInt16, PageCharset String, CodeVersion UInt32, IsLink UInt8, IsDownload UInt8, IsNotBounce UInt8, FUniqID UInt64, HID UInt32, IsOldCounter UInt8, IsEvent UInt8, 
IsParameter UInt8, DontCountHits UInt8, WithHash UInt8, HitColor FixedString(1), UTCEventTime DateTime, Age UInt8, Sex UInt8, Income UInt8, Interests UInt16, Robotness UInt8, GeneralInterests Array(UInt16), RemoteIP UInt32, RemoteIP6 FixedString(16), WindowName Int32, OpenerName Int32, HistoryLength Int16, BrowserLanguage FixedString(2), BrowserCountry FixedString(2), SocialNetwork String, SocialAction String, HTTPError UInt16, SendTiming Int32, DNSTiming Int32, ConnectTiming Int32, ResponseStartTiming Int32, ResponseEndTiming Int32, FetchTiming Int32, RedirectTiming Int32, DOMInteractiveTiming Int32, DOMContentLoadedTiming Int32, DOMCompleteTiming Int32, LoadEventStartTiming Int32, LoadEventEndTiming Int32, NSToDOMContentLoadedTiming Int32, FirstPaintTiming Int32, RedirectCount Int8, SocialSourceNetworkID UInt8, SocialSourcePage String, ParamPrice Int64, ParamOrderID String, ParamCurrency FixedString(3), ParamCurrencyID UInt16, GoalsReached Array(UInt32), OpenstatServiceName String, OpenstatCampaignID String, OpenstatAdID String, OpenstatSourceID String, UTMSource String, UTMMedium String, UTMCampaign String, UTMContent String, UTMTerm String, FromTag String, HasGCLID UInt8, RefererHash UInt64, URLHash UInt64, CLID UInt32, YCLID UInt64, ShareService String, ShareURL String, ShareTitle String, ParsedParams Nested(Key1 String, Key2 String, Key3 String, Key4 String, Key5 String, ValueDouble Float64), IslandID FixedString(16), RequestNum UInt32, RequestTry UInt8) ENGINE = MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity = 8192, storage_policy='s3_cache'" clickhouse-client --query "INSERT INTO test.hits_s3 SELECT * FROM test.hits SETTINGS enable_filesystem_cache_on_write_operations=0" fi @@ -128,6 +218,10 @@ function run_tests() ADDITIONAL_OPTIONS+=('--replicated-database') fi + if [[ -n "$USE_S3_STORAGE_FOR_MERGE_TREE" ]] && [[ "$USE_S3_STORAGE_FOR_MERGE_TREE" -eq 1 ]]; then + ADDITIONAL_OPTIONS+=('--s3-storage') + fi + if [[ -n "$USE_DATABASE_ORDINARY" ]] && [[ "$USE_DATABASE_ORDINARY" -eq 1 ]]; then ADDITIONAL_OPTIONS+=('--db-engine=Ordinary') fi @@ -135,7 +229,7 @@ function run_tests() set +e if [[ -n "$USE_PARALLEL_REPLICAS" ]] && [[ "$USE_PARALLEL_REPLICAS" -eq 1 ]]; then - clickhouse-test --client="clickhouse-client --use_hedged_requests=0 --allow_experimental_parallel_reading_from_replicas=1 --parallel_replicas_for_non_replicated_merge_tree=1 \ + clickhouse-test --client="clickhouse-client --allow_experimental_parallel_reading_from_replicas=1 --parallel_replicas_for_non_replicated_merge_tree=1 \ --max_parallel_replicas=100 --cluster_for_parallel_replicas='parallel_replicas'" \ -j 2 --testname --shard --zookeeper --check-zookeeper-session --no-stateless --no-parallel-replicas --hung-check --print-time "${ADDITIONAL_OPTIONS[@]}" \ "$SKIP_TESTS_OPTION" 2>&1 | ts '%Y-%m-%d %H:%M:%S' | tee test_output/test_result.txt diff --git a/docker/test/stateful/s3downloader b/docker/test/stateful/s3downloader index 96f2aa96dd5..77601fb5af6 100755 --- a/docker/test/stateful/s3downloader +++ b/docker/test/stateful/s3downloader @@ -30,7 +30,7 @@ def build_url(base_url, dataset): return os.path.join(base_url, dataset, "partitions", AVAILABLE_DATASETS[dataset]) -def dowload_with_progress(url, path): +def download_with_progress(url, path): logging.info("Downloading from %s to temp path %s", url, path) for i in range(RETRIES_COUNT): try: @@ -110,7 +110,7 @@ if __name__ == "__main__": temp_archive_path = 
_get_temp_file_name() try: download_url_for_dataset = build_url(args.url_prefix, dataset) - dowload_with_progress(download_url_for_dataset, temp_archive_path) + download_with_progress(download_url_for_dataset, temp_archive_path) unpack_to_clickhouse_directory(temp_archive_path, args.clickhouse_data_path) except Exception as ex: logging.info("Some exception occured %s", str(ex)) diff --git a/docker/test/stateless/run.sh b/docker/test/stateless/run.sh index a2e2a708aaf..4e9486d7286 100755 --- a/docker/test/stateless/run.sh +++ b/docker/test/stateless/run.sh @@ -58,6 +58,7 @@ if [[ -n "$BUGFIX_VALIDATE_CHECK" ]] && [[ "$BUGFIX_VALIDATE_CHECK" -eq 1 ]]; th # it contains some new settings, but we can safely remove it rm /etc/clickhouse-server/users.d/s3_cache_new.xml + rm /etc/clickhouse-server/config.d/zero_copy_destructive_operations.xml fi # For flaky check we also enable thread fuzzer @@ -216,11 +217,11 @@ export -f run_tests if [ "$NUM_TRIES" -gt "1" ]; then # We don't run tests with Ordinary database in PRs, only in master. # So run new/changed tests with Ordinary at least once in flaky check. - timeout "$MAX_RUN_TIME" bash -c 'NUM_TRIES=1; USE_DATABASE_ORDINARY=1; run_tests' \ + timeout_with_logging "$MAX_RUN_TIME" bash -c 'NUM_TRIES=1; USE_DATABASE_ORDINARY=1; run_tests' \ | sed 's/All tests have finished//' | sed 's/No tests were run//' ||: fi -timeout "$MAX_RUN_TIME" bash -c run_tests ||: +timeout_with_logging "$MAX_RUN_TIME" bash -c run_tests ||: echo "Files in current directory" ls -la ./ @@ -300,9 +301,6 @@ if [[ -n "$USE_DATABASE_REPLICATED" ]] && [[ "$USE_DATABASE_REPLICATED" -eq 1 ]] rg -Fa "" /var/log/clickhouse-server/clickhouse-server2.log ||: zstd --threads=0 < /var/log/clickhouse-server/clickhouse-server1.log > /test_output/clickhouse-server1.log.zst ||: zstd --threads=0 < /var/log/clickhouse-server/clickhouse-server2.log > /test_output/clickhouse-server2.log.zst ||: - # FIXME: remove once only github actions will be left - rm /var/log/clickhouse-server/clickhouse-server1.log - rm /var/log/clickhouse-server/clickhouse-server2.log mv /var/log/clickhouse-server/stderr1.log /test_output/ ||: mv /var/log/clickhouse-server/stderr2.log /test_output/ ||: tar -chf /test_output/coordination1.tar /var/lib/clickhouse1/coordination ||: diff --git a/docker/test/stateless/utils.lib b/docker/test/stateless/utils.lib index 1204434d853..9b6ab535a90 100644 --- a/docker/test/stateless/utils.lib +++ b/docker/test/stateless/utils.lib @@ -35,4 +35,17 @@ function fn_exists() { declare -F "$1" > /dev/null; } +function timeout_with_logging() { + local exit_code=0 + + timeout "${@}" || exit_code="${?}" + + if [[ "${exit_code}" -eq "124" ]] + then + echo "The command 'timeout ${*}' has been killed by timeout" + fi + + return $exit_code +} + # vi: ft=bash diff --git a/docker/test/stress/run.sh b/docker/test/stress/run.sh index afc1a386a48..67056cc1bc1 100644 --- a/docker/test/stress/run.sh +++ b/docker/test/stress/run.sh @@ -65,9 +65,27 @@ chmod 777 -R /var/lib/clickhouse clickhouse-client --query "ATTACH DATABASE IF NOT EXISTS datasets ENGINE = Ordinary" clickhouse-client --query "CREATE DATABASE IF NOT EXISTS test" + stop mv /var/log/clickhouse-server/clickhouse-server.log /var/log/clickhouse-server/clickhouse-server.initial.log +# Randomize cache policies. 
+cache_policy="" +if [ $(( $(date +%-d) % 2 )) -eq 1 ]; then + cache_policy="SLRU" +else + cache_policy="LRU" +fi + +echo "Using cache policy: $cache_policy" + +if [ "$cache_policy" = "SLRU" ]; then + sudo cat /etc/clickhouse-server/config.d/storage_conf.xml \ + | sed "s|LRU|SLRU|" \ + > /etc/clickhouse-server/config.d/storage_conf.xml.tmp + mv /etc/clickhouse-server/config.d/storage_conf.xml.tmp /etc/clickhouse-server/config.d/storage_conf.xml +fi + start clickhouse-client --query "SHOW TABLES FROM datasets" @@ -191,6 +209,13 @@ sudo cat /etc/clickhouse-server/config.d/logger_trace.xml \ > /etc/clickhouse-server/config.d/logger_trace.xml.tmp mv /etc/clickhouse-server/config.d/logger_trace.xml.tmp /etc/clickhouse-server/config.d/logger_trace.xml +if [ "$cache_policy" = "SLRU" ]; then + sudo cat /etc/clickhouse-server/config.d/storage_conf.xml \ + | sed "s|LRU|SLRU|" \ + > /etc/clickhouse-server/config.d/storage_conf.xml.tmp + mv /etc/clickhouse-server/config.d/storage_conf.xml.tmp /etc/clickhouse-server/config.d/storage_conf.xml +fi + # Randomize async_load_databases if [ $(( $(date +%-d) % 2 )) -eq 1 ]; then sudo echo "true" \ diff --git a/docker/test/style/run.sh b/docker/test/style/run.sh index 315efb9e6c4..cc6cb292b66 100755 --- a/docker/test/style/run.sh +++ b/docker/test/style/run.sh @@ -23,6 +23,7 @@ echo "Check submodules" | ts ./check-submodules |& tee /test_output/submodules_output.txt echo "Check shell scripts with shellcheck" | ts ./shellcheck-run.sh |& tee /test_output/shellcheck_output.txt + /process_style_check_result.py || echo -e "failure\tCannot parse results" > /test_output/check_status.tsv echo "Check help for changelog generator works" | ts cd ../changelog || exit 1 diff --git a/docker/test/upgrade/run.sh b/docker/test/upgrade/run.sh index 158ac19229e..f014fce49f6 100644 --- a/docker/test/upgrade/run.sh +++ b/docker/test/upgrade/run.sh @@ -77,6 +77,7 @@ remove_keeper_config "create_if_not_exists" "[01]" # it contains some new settings, but we can safely remove it rm /etc/clickhouse-server/config.d/merge_tree.xml rm /etc/clickhouse-server/config.d/enable_wait_for_shutdown_replicated_tables.xml +rm /etc/clickhouse-server/config.d/zero_copy_destructive_operations.xml rm /etc/clickhouse-server/users.d/nonconst_timezone.xml rm /etc/clickhouse-server/users.d/s3_cache_new.xml rm /etc/clickhouse-server/users.d/replicated_ddl_entry.xml @@ -115,6 +116,7 @@ sudo chgrp clickhouse /etc/clickhouse-server/config.d/s3_storage_policy_by_defau # it contains some new settings, but we can safely remove it rm /etc/clickhouse-server/config.d/merge_tree.xml rm /etc/clickhouse-server/config.d/enable_wait_for_shutdown_replicated_tables.xml +rm /etc/clickhouse-server/config.d/zero_copy_destructive_operations.xml rm /etc/clickhouse-server/users.d/nonconst_timezone.xml rm /etc/clickhouse-server/users.d/s3_cache_new.xml rm /etc/clickhouse-server/users.d/replicated_ddl_entry.xml diff --git a/docs/changelogs/v23.11.1.2711-stable.md b/docs/changelogs/v23.11.1.2711-stable.md new file mode 100644 index 00000000000..e32dee41dc7 --- /dev/null +++ b/docs/changelogs/v23.11.1.2711-stable.md @@ -0,0 +1,525 @@ +--- +sidebar_position: 1 +sidebar_label: 2023 +--- + +# 2023 Changelog + +### ClickHouse release v23.11.1.2711-stable (05bc8ef1e02) FIXME as compared to v23.10.1.1976-stable (13adae0e42f) + +#### Backward Incompatible Change +* Formatters `%l`/`%k`/`%c` in function `parseDateTime()` are now able to parse hours/months without leading zeros, e.g. 
`select parseDateTime('2023-11-26 8:14', '%F %k:%i')` now works. Set `parsedatetime_parse_without_leading_zeros = 0` to restore the previous behavior which required two digits. Function `formatDateTime` is now also able to print hours/months without leading zeros. This is controlled by the setting `formatdatetime_format_without_leading_zeros`, which is off by default to not break existing use cases. [#55872](https://github.com/ClickHouse/ClickHouse/pull/55872) ([Azat Khuzhin](https://github.com/azat)). +* You can no longer use the aggregate function `avgWeighted` with arguments of type `Decimal`. Workaround: convert arguments to `Float64`. This closes [#43928](https://github.com/ClickHouse/ClickHouse/issues/43928). This closes [#31768](https://github.com/ClickHouse/ClickHouse/issues/31768). This closes [#56435](https://github.com/ClickHouse/ClickHouse/issues/56435). If you have used this function inside materialized views or projections with `Decimal` arguments, contact support@clickhouse.com. Fixed error in aggregate function `sumMap` and made it slower around 1.5..2 times. It does not matter because the function is garbage anyway. This closes [#54955](https://github.com/ClickHouse/ClickHouse/issues/54955). This closes [#53134](https://github.com/ClickHouse/ClickHouse/issues/53134). This closes [#55148](https://github.com/ClickHouse/ClickHouse/issues/55148). Fix a bug in function `groupArraySample` - it used the same random seed in case more than one aggregate state is generated in a query. [#56350](https://github.com/ClickHouse/ClickHouse/pull/56350) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* The default ClickHouse server configuration file has enabled `access_management` (user manipulation by SQL queries) and `named_collection_control` (manipulation of named collections by SQL queries) for the `default` user by default. This closes [#56482](https://github.com/ClickHouse/ClickHouse/issues/56482). [#56619](https://github.com/ClickHouse/ClickHouse/pull/56619) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Multiple improvements for RESPECT/IGNORE NULLS. [#57189](https://github.com/ClickHouse/ClickHouse/pull/57189) ([Raúl Marín](https://github.com/Algunenano)). +* Remove the optimization `optimize_move_functions_out_of_any`. [#57190](https://github.com/ClickHouse/ClickHouse/pull/57190) ([Raúl Marín](https://github.com/Algunenano)). + +#### New Feature +* Added server setting `async_load_databases` for asynchronous loading of databases and tables. Speeds up the server start time. Applies to databases with Ordinary, Atomic and Replicated engines. Their tables load metadata asynchronously. A query to a table increases the priority of the load job and waits for it to be done. Added table `system.async_loader`. [#49351](https://github.com/ClickHouse/ClickHouse/pull/49351) ([Sergei Trifonov](https://github.com/serxa)). +* 1. Add function `extractPlainRanges` to `KeyCondition`. 2. Add some useful functions to `Range`. 3. Add `PlainRanges`, which represents a series of ranges that are ordered and non-overlapping. 4. Add `NumbersRangedSource`, which can accurately return user-selected numbers. [#50909](https://github.com/ClickHouse/ClickHouse/pull/50909) ([JackyWoo](https://github.com/JackyWoo)). +* Add system table `blob_storage_log`. [#52918](https://github.com/ClickHouse/ClickHouse/pull/52918) ([vdimir](https://github.com/vdimir)). +* Use statistics to order PREWHERE conditions better. [#53240](https://github.com/ClickHouse/ClickHouse/pull/53240) ([Han Fei](https://github.com/hanfei1991)).
+* Added a new aggregation function `groupArraySorted(n)(value)` which returns an array with the n first values from a field value sorted by itself. [#53562](https://github.com/ClickHouse/ClickHouse/pull/53562) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Added support for compression in keeper protocol. Can be enabled on clickhouse by using this flag `use_compression` inside `zookeeper`. resolves [#49507](https://github.com/ClickHouse/ClickHouse/issues/49507). [#54957](https://github.com/ClickHouse/ClickHouse/pull/54957) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Add ClickHouse setting to disable tunneling for HTTPS requests over HTTP proxy. [#55033](https://github.com/ClickHouse/ClickHouse/pull/55033) ([Arthur Passos](https://github.com/arthurpassos)). +* Introduce the feature `storage_metadata_write_full_object_key`. If it is set as `true` then metadata files are written with new format VERSION_FULL_OBJECT_KEY. With that format CH stores full remote object key in the metadata file. [#55566](https://github.com/ClickHouse/ClickHouse/pull/55566) ([Sema Checherinda](https://github.com/CheSema)). +* Add new settings and syntax to protect named collections' fields from being overridden. This is meant to prevent a malicious user from obtaining unauthorized access to secrets. [#55782](https://github.com/ClickHouse/ClickHouse/pull/55782) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Add `hostname` column to all system log tables;. [#55894](https://github.com/ClickHouse/ClickHouse/pull/55894) ([Bharat Nallan](https://github.com/bharatnc)). +* Add `CHECK ALL TABLES` query. [#56022](https://github.com/ClickHouse/ClickHouse/pull/56022) ([vdimir](https://github.com/vdimir)). +* Added function `fromDaysSinceYearZero()` which is similar to MySQL's `FROM_DAYS`. E.g. `SELECT fromDaysSinceYearZero(739136)` returns `2023-09-08`. [#56088](https://github.com/ClickHouse/ClickHouse/pull/56088) ([Joanna Hulboj](https://github.com/jh0x)). +* Implemented series period detect method using FFT in pocketFFT lib. [#56171](https://github.com/ClickHouse/ClickHouse/pull/56171) ([Bhavna Jindal](https://github.com/bhavnajindal)). +* Add an external Python tool to view backups and to extract information from them without using ClickHouse. [#56268](https://github.com/ClickHouse/ClickHouse/pull/56268) ([Vitaly Baranov](https://github.com/vitlibar)). +* ... [#56275](https://github.com/ClickHouse/ClickHouse/pull/56275) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* This pull request implements new setting called `preferred_projection_name`. If it is set to a non-empty string, the specified projection would be used if possible. [#56309](https://github.com/ClickHouse/ClickHouse/pull/56309) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* S3 adaptive timeout means that first attempt made with low send and receive timeouts. [#56314](https://github.com/ClickHouse/ClickHouse/pull/56314) ([Sema Checherinda](https://github.com/CheSema)). +* Add 4-letter command for yielding/resigning leadership (https://github.com/ClickHouse/ClickHouse/issues/56352). [#56354](https://github.com/ClickHouse/ClickHouse/pull/56354) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Added a new SQL function, "arrayRandomSample(arr, k)" which returns a sample of k elements from the input array. Similar functionality could previously be achieved only with less convenient syntax, e.g. "SELECT arrayReduce('groupArraySample(3)', range(10))". 
[#56416](https://github.com/ClickHouse/ClickHouse/pull/56416) ([Robert Schulze](https://github.com/rschu1ze)). +* Added support for `float16` type data to use in `.npy` files. Closes [#56344](https://github.com/ClickHouse/ClickHouse/issues/56344). [#56424](https://github.com/ClickHouse/ClickHouse/pull/56424) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Added system view `information_schema.statistics` for better compatibility with Tableau Online. [#56425](https://github.com/ClickHouse/ClickHouse/pull/56425) ([Serge Klochkov](https://github.com/slvrtrn)). +* Add function `getClientHTTPHeader` for fetching values header values set in the HTTP request. [#56488](https://github.com/ClickHouse/ClickHouse/pull/56488) ([凌涛](https://github.com/lingtaolf)). +* Add a new table function named `fuzzJSON` with rows containing perturbed versions of the source JSON string with random variations. [#56490](https://github.com/ClickHouse/ClickHouse/pull/56490) ([Julia Kartseva](https://github.com/jkartseva)). +* Add `system.symbols` table useful for introspection of the binary. [#56548](https://github.com/ClickHouse/ClickHouse/pull/56548) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add 4-letter command for yielding/resigning leadership. [#56620](https://github.com/ClickHouse/ClickHouse/pull/56620) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Configurable dashboards. Queries for charts are now loaded using a query, which by default uses a new `system.dashboards` table. [#56771](https://github.com/ClickHouse/ClickHouse/pull/56771) ([Sergei Trifonov](https://github.com/serxa)). +* Introduce `fileCluster` table function. [#56868](https://github.com/ClickHouse/ClickHouse/pull/56868) ([Andrey Zvonov](https://github.com/zvonand)). +* Add `_size` virtual column with file size in bytes to `s3/file/hdfs/url/azureBlobStorage` engines. [#57126](https://github.com/ClickHouse/ClickHouse/pull/57126) ([Kruglov Pavel](https://github.com/Avogar)). +* Expose the number of errors occurred on a server since last restart from the Prometheus endpoint. [#57209](https://github.com/ClickHouse/ClickHouse/pull/57209) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Added a new SQL function `sqid` to generate Sqids (https://sqids.org/), example: `SELECT sqid(125, 126)`. [#57442](https://github.com/ClickHouse/ClickHouse/pull/57442) ([awakeljw](https://github.com/awakeljw)). + +#### Performance Improvement +* Support window functions parallel evaluation. Fixes [#34688](https://github.com/ClickHouse/ClickHouse/issues/34688). [#39631](https://github.com/ClickHouse/ClickHouse/pull/39631) ([Dmitry Novik](https://github.com/novikd)). +* Increase the default value of `max_concurrent_queries` from 100 to 1000. This makes sense when there is a large number of connecting clients, which are slowly sending or receiving data, so the server is not limited by CPU, or when the number of CPU cores is larger than 100. Also, enable the concurrency control by default, and set the desired number of query processing threads in total as twice the number of CPU cores. It improves performance in scenarios with a very large number of concurrent queries. [#46927](https://github.com/ClickHouse/ClickHouse/pull/46927) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fixed filtering by `IN(...)` condition for `Merge` table engine. [#54905](https://github.com/ClickHouse/ClickHouse/pull/54905) ([Nikita Taranov](https://github.com/nickitat)). 
+* An improvement which takes place when cache is full and there are big reads. [#55158](https://github.com/ClickHouse/ClickHouse/pull/55158) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Add ability to disable checksums for S3 to avoid excessive input file read (this new behavior could be enabled with `s3_disable_checksum=true`). [#55559](https://github.com/ClickHouse/ClickHouse/pull/55559) ([Azat Khuzhin](https://github.com/azat)). +* Now we read synchronously from remote tables when data is in page cache (like we do for local tables). It is faster, doesn't require synchronisation inside thread pool, doesn't hesitate to do `seek`-s on local fs and reduces cpu wait. [#55841](https://github.com/ClickHouse/ClickHouse/pull/55841) ([Nikita Taranov](https://github.com/nickitat)). +* ... This PR follows [#55929](https://github.com/ClickHouse/ClickHouse/issues/55929), it will bring about 30% speedup. - reduce the reserved memory - reduce the `resize` call. [#55957](https://github.com/ClickHouse/ClickHouse/pull/55957) ([lgbo](https://github.com/lgbo-ustc)). +* The performance experiments of **OnTime** on the ICX device (Intel Xeon Platinum 8380 CPU, 80 cores, 160 threads) show that this change could bring the improvements of **7.4%, 5.9%, 4.7%, 3.0%, and 4.6%** to the QPS of the query Q2, Q3, Q4, Q5 and Q6 respectively while having no impact on others. [#56079](https://github.com/ClickHouse/ClickHouse/pull/56079) ([Zhiguo Zhou](https://github.com/ZhiguoZh)). +* Limit the number of threads busy inside the query profiler. If there are more - they will skip profiling. [#56105](https://github.com/ClickHouse/ClickHouse/pull/56105) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* WindowTransform decrease amount of virtual function calls. [#56120](https://github.com/ClickHouse/ClickHouse/pull/56120) ([Maksim Kita](https://github.com/kitaisreal)). +* Allow recursive tuple field pruning in ORC to speed up scaning. [#56122](https://github.com/ClickHouse/ClickHouse/pull/56122) ([李扬](https://github.com/taiyang-li)). +* This pull request provides countRows support for Npy data format. Now with setting `optimize_count_from_files=1` queries like `select count() from file(data.npy)` will work much more fast because of caching the results. [#56304](https://github.com/ClickHouse/ClickHouse/pull/56304) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Queries with aggregation and a large number of streams will use less amount of memory during the plan's construction. [#57074](https://github.com/ClickHouse/ClickHouse/pull/57074) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Improve performance of executing queries for use cases with many users. [#57106](https://github.com/ClickHouse/ClickHouse/pull/57106) ([Andrej Hoos](https://github.com/adikus)). +* Trivial improvement on array join, reuse some intermediate results. [#57183](https://github.com/ClickHouse/ClickHouse/pull/57183) ([李扬](https://github.com/taiyang-li)). +* There are cases when stack unwinding was slow. [#57221](https://github.com/ClickHouse/ClickHouse/pull/57221) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Now we use default read pool for reading from external storage when `max_streams = 1`. It is beneficial when read prefetches are enabled. [#57334](https://github.com/ClickHouse/ClickHouse/pull/57334) ([Nikita Taranov](https://github.com/nickitat)). + +#### Improvement +* Engine `Merge` filters the records according to the row policies of the underlying tables. 
[#50209](https://github.com/ClickHouse/ClickHouse/pull/50209) ([Ilya Golshtein](https://github.com/ilejn)). +* Add a setting `max_execution_time_leaf` to limit the execution time on shards for distributed queries, and `timeout_overflow_mode_leaf` to control the behaviour if a timeout happens. [#51823](https://github.com/ClickHouse/ClickHouse/pull/51823) ([Duc Canh Le](https://github.com/canhld94)). +* Fix possible PostgreSQL logical replication `conversion_error` when using MaterializedPostgreSQL. [#53721](https://github.com/ClickHouse/ClickHouse/pull/53721) ([takakawa](https://github.com/takakawa)). +* Set `background_fetches_pool_size` to 16 and `background_schedule_pool_size` to 512, which is better for production usage with frequent small insertions. [#54327](https://github.com/ClickHouse/ClickHouse/pull/54327) ([Denny Crane](https://github.com/den-crane)). +* When reading data from a CSV file in which a line ends with '\r' not followed by '\n', the exception ``` Cannot parse CSV format: found \r (CR) not followed by \n (LF). Line must end by \n (LF) or \r\n (CR LF) or \n\r.: ``` was encountered. In ClickHouse, a CSV end of line must be \n, \r\n or \n\r, so the \r must be followed by \n; but in some situations the CSV input data is abnormal and, as above, \r is at the end of a line. [#54340](https://github.com/ClickHouse/ClickHouse/pull/54340) ([KevinyhZou](https://github.com/KevinyhZou)). +* Update the Arrow library to release-13.0.0, which supports new encodings. Closes [#44505](https://github.com/ClickHouse/ClickHouse/issues/44505). [#54800](https://github.com/ClickHouse/ClickHouse/pull/54800) ([Kruglov Pavel](https://github.com/Avogar)). +* Improve performance of ON CLUSTER queries by removing heavy system calls to get all network interfaces when looking for the local IP address in the DDL entry hosts list. [#54909](https://github.com/ClickHouse/ClickHouse/pull/54909) ([Duc Canh Le](https://github.com/canhld94)). +* Keeper improvement: improve memory usage during startup by delaying log preprocessing. [#55660](https://github.com/ClickHouse/ClickHouse/pull/55660) ([Antonio Andelic](https://github.com/antonio2368)). +* Fixed accounting of memory allocated before attaching a thread to a query or a user. [#56089](https://github.com/ClickHouse/ClickHouse/pull/56089) ([Nikita Taranov](https://github.com/nickitat)). +* ClickHouse Keeper reports its running availability zone at the `/keeper/availability-zone` path when running in an AWS environment. [#56104](https://github.com/ClickHouse/ClickHouse/pull/56104) ([Jianfei Hu](https://github.com/incfly)). +* Add support for LARGE_LIST with Arrow. [#56118](https://github.com/ClickHouse/ClickHouse/pull/56118) ([edef](https://github.com/edef1c)). +* Improved performance of glob matching for `file` and `hdfs` storages. [#56141](https://github.com/ClickHouse/ClickHouse/pull/56141) ([Andrey Zvonov](https://github.com/zvonand)). +* Allow manual compaction of `EmbeddedRocksDB` via `OPTIMIZE` query. [#56225](https://github.com/ClickHouse/ClickHouse/pull/56225) ([Azat Khuzhin](https://github.com/azat)). +* Posting lists in inverted indexes are now compressed, which reduces their size by 10-30%. [#56226](https://github.com/ClickHouse/ClickHouse/pull/56226) ([Harry Lee](https://github.com/HarryLeeIBM)). +* Add ability to specify BlockBasedTableOptions for EmbeddedRocksDB. [#56264](https://github.com/ClickHouse/ClickHouse/pull/56264) ([Azat Khuzhin](https://github.com/azat)).
+* `SHOW COLUMNS` now displays MySQL's equivalent data type name when the connection was made through the MySQL protocol. Previously, this was the case when setting `use_mysql_types_in_show_columns = 1`. The setting is retained but made obsolete. [#56277](https://github.com/ClickHouse/ClickHouse/pull/56277) ([Robert Schulze](https://github.com/rschu1ze)). +* Fixed possible `The local set of parts of table doesn't look like the set of parts in ZooKeeper` error if the server was restarted just after `TRUNCATE` or `DROP PARTITION`. [#56282](https://github.com/ClickHouse/ClickHouse/pull/56282) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Parallelise `BackupEntriesCollector`. [#56312](https://github.com/ClickHouse/ClickHouse/pull/56312) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fixed handling of non-const query strings in functions `formatQuery()`/`formatQuerySingleLine()`. Also added `OrNull` variants of both functions that return NULL when a query cannot be parsed instead of throwing an exception. [#56327](https://github.com/ClickHouse/ClickHouse/pull/56327) ([Robert Schulze](https://github.com/rschu1ze)). +* Support creating and materializing an index in the same ALTER query; also support modifying TTL and materializing TTL in the same query. Closes [#55651](https://github.com/ClickHouse/ClickHouse/issues/55651). [#56331](https://github.com/ClickHouse/ClickHouse/pull/56331) ([flynn](https://github.com/ucasfl)). +* Enable adding a new disk to the storage configuration without a restart. [#56367](https://github.com/ClickHouse/ClickHouse/pull/56367) ([Duc Canh Le](https://github.com/canhld94)). +* Allow backup of a materialized view with a dropped inner table instead of failing the backup. [#56387](https://github.com/ClickHouse/ClickHouse/pull/56387) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Queries to `system.replicas` initiate requests to ZooKeeper when certain columns are queried. When there are thousands of tables these requests might produce a considerable load on ZooKeeper. If there are multiple simultaneous queries to `system.replicas` they make the same requests multiple times. The change is to "deduplicate" requests from concurrent queries. [#56420](https://github.com/ClickHouse/ClickHouse/pull/56420) ([Alexander Gololobov](https://github.com/davenger)). +* Add transition from reading key to reading quoted key when double quotes are found. [#56423](https://github.com/ClickHouse/ClickHouse/pull/56423) ([Arthur Passos](https://github.com/arthurpassos)). +* Fix transfer query to MySQL compatible query. [#56456](https://github.com/ClickHouse/ClickHouse/pull/56456) ([flynn](https://github.com/ucasfl)). +* Add support for backing up and restoring tables using KeeperMap engine. [#56460](https://github.com/ClickHouse/ClickHouse/pull/56460) ([Antonio Andelic](https://github.com/antonio2368)). +* A 404 response for CompleteMultipartUpload has to be rechecked. The operation could have completed on the server even if the client got a timeout or other network errors, in which case the next retry of CompleteMultipartUpload receives a 404 response. If the object key exists, the operation is considered successful. [#56475](https://github.com/ClickHouse/ClickHouse/pull/56475) ([Sema Checherinda](https://github.com/CheSema)). +* Enable the HTTP OPTIONS method by default - it simplifies requesting ClickHouse from a web browser. [#56483](https://github.com/ClickHouse/ClickHouse/pull/56483) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+* The value for `dns_max_consecutive_failures` was changed by mistake in [#46550](https://github.com/ClickHouse/ClickHouse/issues/46550) - this is reverted and adjusted to a better value. Also, increased the HTTP keep-alive timeout to a reasonable value from production. [#56485](https://github.com/ClickHouse/ClickHouse/pull/56485) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Load base backups lazily (a base backup won't be loaded until it's needed). Also add some log messages and profile events for backups. [#56516](https://github.com/ClickHouse/ClickHouse/pull/56516) ([Vitaly Baranov](https://github.com/vitlibar)). +* Setting `query_cache_store_results_of_queries_with_nondeterministic_functions` (with values `false` or `true`) was marked obsolete. It was replaced by setting `query_cache_nondeterministic_function_handling`, a three-valued enum that controls how the query cache handles queries with non-deterministic functions: a) throw an exception (default behavior), b) save the non-deterministic query result regardless, or c) ignore, i.e. don't throw an exception and don't cache the result. [#56519](https://github.com/ClickHouse/ClickHouse/pull/56519) ([Robert Schulze](https://github.com/rschu1ze)). +* Rewrite equality with `is null` check in JOIN ON section. *Analyzer only*. [#56538](https://github.com/ClickHouse/ClickHouse/pull/56538) ([vdimir](https://github.com/vdimir)). +* Function `concat` now supports arbitrary argument types (instead of only String and FixedString arguments). This makes its behavior more similar to MySQL's `concat` implementation. For example, `SELECT concat('ab', 42)` now returns `ab42`. [#56540](https://github.com/ClickHouse/ClickHouse/pull/56540) ([Serge Klochkov](https://github.com/slvrtrn)). +* Allow getting cache configuration from the 'named_collection' section in the config or from an SQL-created named collection. [#56541](https://github.com/ClickHouse/ClickHouse/pull/56541) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update `query_masking_rules` when reloading the config ([#56449](https://github.com/ClickHouse/ClickHouse/issues/56449)). [#56573](https://github.com/ClickHouse/ClickHouse/pull/56573) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Make removeoutdatedtables() less aggressive when the PostgreSQL connection is unsuccessful. [#56609](https://github.com/ClickHouse/ClickHouse/pull/56609) ([jsc0218](https://github.com/jsc0218)). +* Currently, connecting to PostgreSQL takes too much time when the URL is not right, so the relevant query gets stuck there until it is cancelled. [#56648](https://github.com/ClickHouse/ClickHouse/pull/56648) ([jsc0218](https://github.com/jsc0218)). +* ClickHouse Keeper reports its running availability zone at the `/keeper/availability-zone` path. This can be configured in the server configuration (for example, `us-west-1a`). [#56715](https://github.com/ClickHouse/ClickHouse/pull/56715) ([Jianfei Hu](https://github.com/incfly)). +* Do not allow tables on different replicas to have different aggregate functions in SimpleAggregateFunction columns. [#56724](https://github.com/ClickHouse/ClickHouse/pull/56724) ([Duc Canh Le](https://github.com/canhld94)). +* Add support for the [well-known Protobuf types](https://protobuf.dev/reference/protobuf/google.protobuf/) in the Protobuf format. [#56741](https://github.com/ClickHouse/ClickHouse/pull/56741) ([János Benjamin Antal](https://github.com/antaljanosbenjamin)). +* Keeper improvement: disable compressed logs by default in Keeper.
[#56763](https://github.com/ClickHouse/ClickHouse/pull/56763) ([Antonio Andelic](https://github.com/antonio2368)). +* Add config setting `wait_dictionaries_load_at_startup`. [#56782](https://github.com/ClickHouse/ClickHouse/pull/56782) ([Vitaly Baranov](https://github.com/vitlibar)). +* There was a potential vulnerability in previous ClickHouse versions: if a user has connected and unsuccessfully tried to authenticate with the "interserver secret" method, the server didn't terminate the connection immediately but continued to receive and ignore the leftover packets from the client. While these packets are ignored, they are still parsed, and if they use a compression method with another known vulnerability, it will lead to exploitation of it without authentication. This issue was found with [ClickHouse Bug Bounty Program](https://github.com/ClickHouse/ClickHouse/issues/38986) by https://twitter.com/malacupa. [#56794](https://github.com/ClickHouse/ClickHouse/pull/56794) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fetching a part now waits until that part is fully committed on the remote replica. It is better not to send a part in PreActive state; in case of zero copy this is a mandatory restriction. [#56808](https://github.com/ClickHouse/ClickHouse/pull/56808) ([Sema Checherinda](https://github.com/CheSema)). +* Implement user-level setting `alter_move_to_space_execute_async` which allows executing queries `ALTER TABLE ... MOVE PARTITION|PART TO DISK|VOLUME` asynchronously. The size of the pool for background executions is controlled by `background_move_pool_size`. The default behavior is synchronous execution. Fixes [#47643](https://github.com/ClickHouse/ClickHouse/issues/47643). [#56809](https://github.com/ClickHouse/ClickHouse/pull/56809) ([alesapin](https://github.com/alesapin)). +* Allow filtering by engine when scanning system.tables, avoiding unnecessary (potentially time-consuming) connections. [#56813](https://github.com/ClickHouse/ClickHouse/pull/56813) ([jsc0218](https://github.com/jsc0218)). +* Show `total_bytes` and `total_rows` in system tables for RocksDB storage. [#56816](https://github.com/ClickHouse/ClickHouse/pull/56816) ([Aleksandr Musorin](https://github.com/AVMusorin)). +* Allow basic commands in ALTER for TEMPORARY tables. [#56892](https://github.com/ClickHouse/ClickHouse/pull/56892) ([Sergey](https://github.com/icuken)). +* LZ4 compression: buffer the compressed block in a rare case when the output buffer capacity is not enough for writing the compressed block directly to the output buffer. [#56938](https://github.com/ClickHouse/ClickHouse/pull/56938) ([Sema Checherinda](https://github.com/CheSema)). +* Add metrics for the number of queued jobs, which is useful for the IO thread pool. [#56958](https://github.com/ClickHouse/ClickHouse/pull/56958) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add a setting for the PostgreSQL table engine in the config file, a check for the setting, and documentation around the additional setting. [#56959](https://github.com/ClickHouse/ClickHouse/pull/56959) ([Peignon Melvyn](https://github.com/melvynator)). +* Run the interpreter with the `only_analyze` flag in the getsampleblock method. [#56972](https://github.com/ClickHouse/ClickHouse/pull/56972) ([Mikhail Artemenko](https://github.com/Michicosun)). +* Add a new `MergeTree` setting `add_implicit_sign_column_constraint_for_collapsing_engine` (disabled by default).
When enabled, it adds an implicit CHECK constraint for `CollapsingMergeTree` tables that restricts the value of the `Sign` column to be only -1 or 1. [#56701](https://github.com/ClickHouse/ClickHouse/issues/56701). [#56986](https://github.com/ClickHouse/ClickHouse/pull/56986) ([Kevin Mingtarja](https://github.com/kevinmingtarja)). +* Function `concat()` can now be called with a single argument, e.g., `SELECT concat('abc')`. This makes its behavior more consistent with MySQL's concat implementation. [#57000](https://github.com/ClickHouse/ClickHouse/pull/57000) ([Serge Klochkov](https://github.com/slvrtrn)). +* Signs all `x-amz-*` headers as required by AWS S3 docs. [#57001](https://github.com/ClickHouse/ClickHouse/pull/57001) ([Arthur Passos](https://github.com/arthurpassos)). +* Function `fromDaysSinceYearZero` (alias: `FROM_DAYS`) can now be used with unsigned and signed integer types (previously, it had to be an unsigned integer). This improve compatibility with 3rd party tools such as Tableau Online. [#57002](https://github.com/ClickHouse/ClickHouse/pull/57002) ([Serge Klochkov](https://github.com/slvrtrn)). +* Add system.s3queue_log to default config. [#57036](https://github.com/ClickHouse/ClickHouse/pull/57036) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Change the default for `wait_dictionaries_load_at_startup` to true, and use this setting only if `dictionaries_lazy_load` is false. [#57133](https://github.com/ClickHouse/ClickHouse/pull/57133) ([Vitaly Baranov](https://github.com/vitlibar)). +* Check dictionary source type on creation even if `dictionaries_lazy_load` is enabled. [#57134](https://github.com/ClickHouse/ClickHouse/pull/57134) ([Vitaly Baranov](https://github.com/vitlibar)). +* Plan-level optimizations can now be enabled/disabled individually. Previously, it was only possible to disable them all. The setting which previously did that (`query_plan_enable_optimizations`) is retained and can still be used to disable all optimizations. [#57152](https://github.com/ClickHouse/ClickHouse/pull/57152) ([Robert Schulze](https://github.com/rschu1ze)). +* The server's exit code will correspond to the exception code. For example, if the server cannot start due to memory limit, it will exit with the code 241 = MEMORY_LIMIT_EXCEEDED. In previous versions, the exit code for exceptions was always 70 = Poco::Util::ExitCode::EXIT_SOFTWARE. [#57153](https://github.com/ClickHouse/ClickHouse/pull/57153) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Do not demangle and symbolize stack frames from __functional c++ header. [#57201](https://github.com/ClickHouse/ClickHouse/pull/57201) ([Mike Kot](https://github.com/myrrc)). +* It is now possible to refer to ALIAS column in index (non-primary-key) definitions (issue [#55650](https://github.com/ClickHouse/ClickHouse/issues/55650)). Example: `CREATE TABLE tab(col UInt32, col_alias ALIAS col + 1, INDEX idx (col_alias) TYPE minmax) ENGINE = MergeTree ORDER BY col;`. [#57220](https://github.com/ClickHouse/ClickHouse/pull/57220) ([flynn](https://github.com/ucasfl)). +* HTTP server page `/dashboard` now supports charts with multiple lines. [#57236](https://github.com/ClickHouse/ClickHouse/pull/57236) ([Sergei Trifonov](https://github.com/serxa)). +* This pr gives possibility to use suffixes (K, M, G, T, E) along with the amount of memory to be used. Closes [#56879](https://github.com/ClickHouse/ClickHouse/issues/56879). 
[#57273](https://github.com/ClickHouse/ClickHouse/pull/57273) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Bumped Intel QPL (used by codec `DEFLATE_QPL`) from v1.2.0 to v1.3.1 . Also fixed a bug in case of BOF (Block On Fault) = 0, changed to handle page faults by falling back to SW path. [#57291](https://github.com/ClickHouse/ClickHouse/pull/57291) ([jasperzhu](https://github.com/jinjunzh)). +* Make alter materialized view non experimental and deprecate `allow_experimental_alter_materialized_view_structure` setting. Fixes [#15206](https://github.com/ClickHouse/ClickHouse/issues/15206). [#57311](https://github.com/ClickHouse/ClickHouse/pull/57311) ([alesapin](https://github.com/alesapin)). +* Increase default `replicated_deduplication_window` of MergeTree settings from 100 to 1k. [#57335](https://github.com/ClickHouse/ClickHouse/pull/57335) ([sichenzhao](https://github.com/sichenzhao)). +* Stop using `INCONSISTENT_METADATA_FOR_BACKUP` that much. If possible prefer to continue scanning instead of stopping and starting the scanning for backup from the beginning. [#57385](https://github.com/ClickHouse/ClickHouse/pull/57385) ([Vitaly Baranov](https://github.com/vitlibar)). +* Introduce the limit for the maximum number of table projections (default 25). [#57491](https://github.com/ClickHouse/ClickHouse/pull/57491) ([Julia Kartseva](https://github.com/jkartseva)). +* Enable `async_block_ids_cache` by default for `async_inserts` deduplication. [#57513](https://github.com/ClickHouse/ClickHouse/pull/57513) ([alesapin](https://github.com/alesapin)). + +#### Build/Testing/Packaging Improvement +* Enable temporary_data_in_cache in s3 tests in CI. [#48425](https://github.com/ClickHouse/ClickHouse/pull/48425) ([vdimir](https://github.com/vdimir)). +* Run sqllogic test. [#56078](https://github.com/ClickHouse/ClickHouse/pull/56078) ([Han Fei](https://github.com/hanfei1991)). +* Add a new build option `SANITIZE_COVERAGE`. If it is enabled, the code is instrumented to track the coverage. The collected information is available inside ClickHouse with: (1) a new function `coverage` that returns an array of unique addresses in the code found after the previous coverage reset; (2) `SYSTEM RESET COVERAGE` query that resets the accumulated data. This allows us to compare the coverage of different tests, including differential code coverage. Continuation of [#20539](https://github.com/ClickHouse/ClickHouse/issues/20539). [#56102](https://github.com/ClickHouse/ClickHouse/pull/56102) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* In [#54043](https://github.com/ClickHouse/ClickHouse/issues/54043) the setup plan started to appear in the logs. It should be only in the `runner_get_all_tests.log` only. As well, send the failed infrastructure event to CI db. [#56214](https://github.com/ClickHouse/ClickHouse/pull/56214) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Some of the stack frames might not be resolved when collecting stacks. In such cases the raw address might be helpful. [#56267](https://github.com/ClickHouse/ClickHouse/pull/56267) ([Alexander Gololobov](https://github.com/davenger)). +* Add an option to disable libssh. [#56333](https://github.com/ClickHouse/ClickHouse/pull/56333) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add automatic check that there are no large translation units. [#56559](https://github.com/ClickHouse/ClickHouse/pull/56559) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Lower the size of the single-binary distribution. 
This closes [#55181](https://github.com/ClickHouse/ClickHouse/issues/55181). [#56617](https://github.com/ClickHouse/ClickHouse/pull/56617) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Make `clickhouse-local` and `clickhouse-client` available under short names (`ch`, `chl`, `chc`) for usability. [#56634](https://github.com/ClickHouse/ClickHouse/pull/56634) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Information about the sizes of every translation unit and binary file after each build will be sent to the CI database in ClickHouse Cloud. This closes [#56107](https://github.com/ClickHouse/ClickHouse/issues/56107). [#56636](https://github.com/ClickHouse/ClickHouse/pull/56636) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Certain files of "Apache Arrow" library (which we use only for non-essential things like parsing the arrow format) were rebuilt all the time regardless of the build cache. This is fixed. [#56657](https://github.com/ClickHouse/ClickHouse/pull/56657) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Avoid recompiling translation units depending on the autogenerated source file about version. [#56660](https://github.com/ClickHouse/ClickHouse/pull/56660) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Do not fetch changed submodules in the builder container. [#56689](https://github.com/ClickHouse/ClickHouse/pull/56689) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Tracing data of the linker invocations will be sent to the CI database in ClickHouse Cloud. [#56725](https://github.com/ClickHouse/ClickHouse/pull/56725) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Use DWARF 5 debug symbols for the clickhouse binary (was DWARF 4 previously). [#56770](https://github.com/ClickHouse/ClickHouse/pull/56770) ([Michael Kolupaev](https://github.com/al13n321)). +* Optimized build size further by removing unused code from external libraries. [#56786](https://github.com/ClickHouse/ClickHouse/pull/56786) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Set memory usage for client (`1G`) to address problems like this: https://s3.amazonaws.com/clickhouse-test-reports/0/f1bf3f1fc39f520871ec878d815e515e12fd3e7b/fuzzer_astfuzzertsan/report.html. [#56873](https://github.com/ClickHouse/ClickHouse/pull/56873) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* There was an attempt to have the proper listing in [#44311](https://github.com/ClickHouse/ClickHouse/issues/44311), but the fix itself was in the wrong place, so it's still broken. See an [example](https://github.com/ClickHouse/ClickHouse/actions/runs/6897342568/job/18781001022#step:8:25). [#56989](https://github.com/ClickHouse/ClickHouse/pull/56989) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fixed the memory leak in integration test of postgres dictionary. The case of network partition is not correctly handled at the time of the repo pulled years ago. [#57231](https://github.com/ClickHouse/ClickHouse/pull/57231) ([jsc0218](https://github.com/jsc0218)). +* Fix a test filename typo. [#57272](https://github.com/ClickHouse/ClickHouse/pull/57272) ([jsc0218](https://github.com/jsc0218)). +* Fix issue caught in https://github.com/docker-library/official-images/pull/15846. [#57571](https://github.com/ClickHouse/ClickHouse/pull/57571) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). 
+ +#### Bug Fix (user-visible misbehavior in an official stable release) + +* Fix analyzer - insertion from select with subquery referencing insertion table should process only insertion block. [#50857](https://github.com/ClickHouse/ClickHouse/pull/50857) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* Setting JoinAlgorithm respect specified order [#51745](https://github.com/ClickHouse/ClickHouse/pull/51745) ([vdimir](https://github.com/vdimir)). +* Keeper `reconfig`: add timeout before yielding/taking leadership [#53481](https://github.com/ClickHouse/ClickHouse/pull/53481) ([Mike Kot](https://github.com/myrrc)). +* Fix incorrect header in grace hash join and filter pushdown [#53922](https://github.com/ClickHouse/ClickHouse/pull/53922) ([vdimir](https://github.com/vdimir)). +* Select from system tables when table based on table function. [#55540](https://github.com/ClickHouse/ClickHouse/pull/55540) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* RFC: Fix "Cannot find column X in source stream" for Distributed queries with LIMIT BY [#55836](https://github.com/ClickHouse/ClickHouse/pull/55836) ([Azat Khuzhin](https://github.com/azat)). +* Fix 'Cannot read from file:' while running client in a background [#55976](https://github.com/ClickHouse/ClickHouse/pull/55976) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix clickhouse-local exit on bad send_logs_level setting [#55994](https://github.com/ClickHouse/ClickHouse/pull/55994) ([Kruglov Pavel](https://github.com/Avogar)). +* Bug fix explain ast with parameterized view [#56004](https://github.com/ClickHouse/ClickHouse/pull/56004) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Fix a crash during table loading on startup [#56232](https://github.com/ClickHouse/ClickHouse/pull/56232) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ClickHouse-sourced dictionaries with an explicit query [#56236](https://github.com/ClickHouse/ClickHouse/pull/56236) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix segfault in signal handler for Keeper [#56266](https://github.com/ClickHouse/ClickHouse/pull/56266) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix incomplete query result for UNION in view() function. [#56274](https://github.com/ClickHouse/ClickHouse/pull/56274) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix inconsistency of "cast('0' as DateTime64(3))" and "cast('0' as Nullable(DateTime64(3)))" [#56286](https://github.com/ClickHouse/ClickHouse/pull/56286) ([李扬](https://github.com/taiyang-li)). +* Fix rare race condition related to Memory allocation failure [#56303](https://github.com/ClickHouse/ClickHouse/pull/56303) ([alesapin](https://github.com/alesapin)). +* Fix restore from backup with `flatten_nested` and `data_type_default_nullable` [#56306](https://github.com/ClickHouse/ClickHouse/pull/56306) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix crash in case of adding a column with type Object(JSON) [#56307](https://github.com/ClickHouse/ClickHouse/pull/56307) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix crash in filterPushDown [#56380](https://github.com/ClickHouse/ClickHouse/pull/56380) ([vdimir](https://github.com/vdimir)). +* Fix restore from backup with mat view and dropped source table [#56383](https://github.com/ClickHouse/ClickHouse/pull/56383) ([Kseniia Sumarokova](https://github.com/kssenii)). 
+* Fix segfault during Kerberos initialization [#56401](https://github.com/ClickHouse/ClickHouse/pull/56401) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix buffer overflow in T64 [#56434](https://github.com/ClickHouse/ClickHouse/pull/56434) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix nullable primary key in final (2) [#56452](https://github.com/ClickHouse/ClickHouse/pull/56452) ([Amos Bird](https://github.com/amosbird)). +* Fix ON CLUSTER queries without database on initial node [#56484](https://github.com/ClickHouse/ClickHouse/pull/56484) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix startup failure due to TTL dependency [#56489](https://github.com/ClickHouse/ClickHouse/pull/56489) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ALTER COMMENT queries ON CLUSTER [#56491](https://github.com/ClickHouse/ClickHouse/pull/56491) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ALTER COLUMN with ALIAS [#56493](https://github.com/ClickHouse/ClickHouse/pull/56493) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix empty NAMED COLLECTIONs [#56494](https://github.com/ClickHouse/ClickHouse/pull/56494) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix two cases of projection analysis. [#56502](https://github.com/ClickHouse/ClickHouse/pull/56502) ([Amos Bird](https://github.com/amosbird)). +* Fix handling of aliases in query cache [#56545](https://github.com/ClickHouse/ClickHouse/pull/56545) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix conversion from `Nullable(Enum)` to `Nullable(String)` [#56644](https://github.com/ClickHouse/ClickHouse/pull/56644) ([Nikolay Degterinsky](https://github.com/evillique)). +* More reliable log handling in Keeper [#56670](https://github.com/ClickHouse/ClickHouse/pull/56670) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix configuration merge for nodes with substitution attributes [#56694](https://github.com/ClickHouse/ClickHouse/pull/56694) ([Konstantin Bogdanov](https://github.com/thevar1able)). +* Fix duplicate usage of table function input(). [#56695](https://github.com/ClickHouse/ClickHouse/pull/56695) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix: RabbitMQ OpenSSL dynamic loading issue [#56703](https://github.com/ClickHouse/ClickHouse/pull/56703) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix crash in GCD codec in case when zeros present in data [#56704](https://github.com/ClickHouse/ClickHouse/pull/56704) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix 'mutex lock failed: Invalid argument' in clickhouse-local during insert into function [#56710](https://github.com/ClickHouse/ClickHouse/pull/56710) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix Date text parsing in optimistic path [#56765](https://github.com/ClickHouse/ClickHouse/pull/56765) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix crash in FPC codec [#56795](https://github.com/ClickHouse/ClickHouse/pull/56795) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* DatabaseReplicated: fix DDL query timeout after recovering a replica [#56796](https://github.com/ClickHouse/ClickHouse/pull/56796) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix incorrect nullable columns reporting in MySQL binary protocol [#56799](https://github.com/ClickHouse/ClickHouse/pull/56799) ([Serge Klochkov](https://github.com/slvrtrn)). 
+* Support Iceberg metadata files for metastore tables [#56810](https://github.com/ClickHouse/ClickHouse/pull/56810) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix TSAN report under transform [#56817](https://github.com/ClickHouse/ClickHouse/pull/56817) ([Raúl Marín](https://github.com/Algunenano)). +* Fix SET query and SETTINGS formatting [#56825](https://github.com/ClickHouse/ClickHouse/pull/56825) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix failure to start due to table dependency in joinGet [#56828](https://github.com/ClickHouse/ClickHouse/pull/56828) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix flattening existing Nested columns during ADD COLUMN [#56830](https://github.com/ClickHouse/ClickHouse/pull/56830) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix allow cr end of line for csv [#56901](https://github.com/ClickHouse/ClickHouse/pull/56901) ([KevinyhZou](https://github.com/KevinyhZou)). +* Fix `tryBase64Decode()` with invalid input [#56913](https://github.com/ClickHouse/ClickHouse/pull/56913) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix generating deep nested columns in CapnProto/Protobuf schemas [#56941](https://github.com/ClickHouse/ClickHouse/pull/56941) ([Kruglov Pavel](https://github.com/Avogar)). +* Prevent incompatible ALTER of projection columns [#56948](https://github.com/ClickHouse/ClickHouse/pull/56948) ([Amos Bird](https://github.com/amosbird)). +* Fix sqlite file path validation [#56984](https://github.com/ClickHouse/ClickHouse/pull/56984) ([San](https://github.com/santrancisco)). +* S3Queue: fix metadata reference increment [#56990](https://github.com/ClickHouse/ClickHouse/pull/56990) ([Kseniia Sumarokova](https://github.com/kssenii)). +* S3Queue minor fix [#56999](https://github.com/ClickHouse/ClickHouse/pull/56999) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix file path validation for DatabaseFileSystem [#57029](https://github.com/ClickHouse/ClickHouse/pull/57029) ([San](https://github.com/santrancisco)). +* Fix `fuzzBits` with `ARRAY JOIN` [#57033](https://github.com/ClickHouse/ClickHouse/pull/57033) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix Nullptr dereference in partial merge join with joined_subquery_re… [#57048](https://github.com/ClickHouse/ClickHouse/pull/57048) ([vdimir](https://github.com/vdimir)). +* Fix race condition in RemoteSource [#57052](https://github.com/ClickHouse/ClickHouse/pull/57052) ([Raúl Marín](https://github.com/Algunenano)). +* Implement `bitHammingDistance` for big integers [#57073](https://github.com/ClickHouse/ClickHouse/pull/57073) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* S3-style links bug fix [#57075](https://github.com/ClickHouse/ClickHouse/pull/57075) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Fix JSON_QUERY function with multiple numeric paths [#57096](https://github.com/ClickHouse/ClickHouse/pull/57096) ([KevinyhZou](https://github.com/KevinyhZou)). +* Fix buffer overflow in Gorilla codec [#57107](https://github.com/ClickHouse/ClickHouse/pull/57107) ([Nikolay Degterinsky](https://github.com/evillique)). +* Close interserver connection on any exception before authentication [#57142](https://github.com/ClickHouse/ClickHouse/pull/57142) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix segfault after ALTER UPDATE with Nullable MATERIALIZED column [#57147](https://github.com/ClickHouse/ClickHouse/pull/57147) ([Nikolay Degterinsky](https://github.com/evillique)). 
+* Fix incorrect JOIN plan optimization with partially materialized normal projection [#57196](https://github.com/ClickHouse/ClickHouse/pull/57196) ([Amos Bird](https://github.com/amosbird)). +* Ignore comments when comparing column descriptions [#57259](https://github.com/ClickHouse/ClickHouse/pull/57259) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix `ReadonlyReplica` metric for all cases [#57267](https://github.com/ClickHouse/ClickHouse/pull/57267) ([Antonio Andelic](https://github.com/antonio2368)). +* Background merges correctly use temporary data storage in the cache [#57275](https://github.com/ClickHouse/ClickHouse/pull/57275) ([vdimir](https://github.com/vdimir)). +* Keeper fix for changelog and snapshots [#57299](https://github.com/ClickHouse/ClickHouse/pull/57299) ([Antonio Andelic](https://github.com/antonio2368)). +* Ignore finished ON CLUSTER tasks if hostname changed [#57339](https://github.com/ClickHouse/ClickHouse/pull/57339) ([Alexander Tokmakov](https://github.com/tavplubix)). +* MergeTree mutations reuse source part index granularity [#57352](https://github.com/ClickHouse/ClickHouse/pull/57352) ([Maksim Kita](https://github.com/kitaisreal)). +* Fix function jsonMergePatch for partially const columns [#57379](https://github.com/ClickHouse/ClickHouse/pull/57379) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix ubsan error in `Arena` [#57407](https://github.com/ClickHouse/ClickHouse/pull/57407) ([Nikita Taranov](https://github.com/nickitat)). +* fs cache: add limit for background download [#57424](https://github.com/ClickHouse/ClickHouse/pull/57424) ([Kseniia Sumarokova](https://github.com/kssenii)). +* bugfix: correctly parse SYSTEM STOP LISTEN TCP SECURE [#57483](https://github.com/ClickHouse/ClickHouse/pull/57483) ([joelynch](https://github.com/joelynch)). + +#### NO CL ENTRY + +* NO CL ENTRY: 'Revert "Add function `arrayRandomSample()`"'. [#56399](https://github.com/ClickHouse/ClickHouse/pull/56399) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Update README.md'. [#56549](https://github.com/ClickHouse/ClickHouse/pull/56549) ([Tyler Hannan](https://github.com/tylerhannan)). +* NO CL ENTRY: 'Revert "FunctionSleep exception message fix"'. [#56591](https://github.com/ClickHouse/ClickHouse/pull/56591) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Inserting only non-duplicate chunks in MV"'. [#56598](https://github.com/ClickHouse/ClickHouse/pull/56598) ([Maksim Kita](https://github.com/kitaisreal)). +* NO CL ENTRY: 'Add new header for README with updated logo'. [#56607](https://github.com/ClickHouse/ClickHouse/pull/56607) ([Justin de Guzman](https://github.com/justindeguzman)). +* NO CL ENTRY: 'Revert "Add /keeper/availability-zone node to allow server load balancing within AZ."'. [#56610](https://github.com/ClickHouse/ClickHouse/pull/56610) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Add 4-letter command for yielding/resigning leadership"'. [#56611](https://github.com/ClickHouse/ClickHouse/pull/56611) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'fix(docs): correct default value for output_format_parquet_compression_method to 'lz4''. [#56614](https://github.com/ClickHouse/ClickHouse/pull/56614) ([james-seymour-cubiko](https://github.com/james-seymour-cubiko)). +* NO CL ENTRY: 'Update except.md'. [#56651](https://github.com/ClickHouse/ClickHouse/pull/56651) ([rondo_1895](https://github.com/yangguang1991)). 
+* NO CL ENTRY: 'Revert "Add a setting max_execution_time_leaf to limit the execution time on shard for distributed query"'. [#56702](https://github.com/ClickHouse/ClickHouse/pull/56702) ([Alexander Tokmakov](https://github.com/tavplubix)). +* NO CL ENTRY: 'Revert "Better except for SSL authentication failure"'. [#56844](https://github.com/ClickHouse/ClickHouse/pull/56844) ([Antonio Andelic](https://github.com/antonio2368)). +* NO CL ENTRY: 'Revert "s3 adaptive timeouts"'. [#56992](https://github.com/ClickHouse/ClickHouse/pull/56992) ([Alexander Tokmakov](https://github.com/tavplubix)). +* NO CL ENTRY: 'Revert "Revert "s3 adaptive timeouts""'. [#56994](https://github.com/ClickHouse/ClickHouse/pull/56994) ([Sema Checherinda](https://github.com/CheSema)). +* NO CL ENTRY: 'Revert "Resubmit 01600_parts_types_metrics test (possibly without flakiness)"'. [#57163](https://github.com/ClickHouse/ClickHouse/pull/57163) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Mark select() as harmful function"'. [#57195](https://github.com/ClickHouse/ClickHouse/pull/57195) ([Alexander Tokmakov](https://github.com/tavplubix)). +* NO CL ENTRY: 'Revert "Update Sentry"'. [#57229](https://github.com/ClickHouse/ClickHouse/pull/57229) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Add debugging info for 01600_parts_types_metrics on failures"'. [#57232](https://github.com/ClickHouse/ClickHouse/pull/57232) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Update date-time-functions.md"'. [#57329](https://github.com/ClickHouse/ClickHouse/pull/57329) ([Denny Crane](https://github.com/den-crane)). +* NO CL ENTRY: 'Revert "add function getClientHTTPHeader"'. [#57510](https://github.com/ClickHouse/ClickHouse/pull/57510) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Add `sqid()` function"'. [#57511](https://github.com/ClickHouse/ClickHouse/pull/57511) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Add new aggregation function groupArraySorted()"'. [#57519](https://github.com/ClickHouse/ClickHouse/pull/57519) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Implemented series period detect method using pocketfft lib"'. [#57536](https://github.com/ClickHouse/ClickHouse/pull/57536) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Support use alias column in indices"'. [#57537](https://github.com/ClickHouse/ClickHouse/pull/57537) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### NOT FOR CHANGELOG / INSIGNIFICANT + +* Remove useless "install" from CMake (step 1) [#36589](https://github.com/ClickHouse/ClickHouse/pull/36589) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Analyzer support 'is not distinct from' in join on section [#54068](https://github.com/ClickHouse/ClickHouse/pull/54068) ([vdimir](https://github.com/vdimir)). +* Refactor merge join transform [#55007](https://github.com/ClickHouse/ClickHouse/pull/55007) ([Alex Cheng](https://github.com/Alex-Cheng)). +* Add function jaccardIndex back with better performance [#55126](https://github.com/ClickHouse/ClickHouse/pull/55126) ([vdimir](https://github.com/vdimir)). +* Use more thread pools in BACKUP/RESTORE to avoid its hanging in tests [#55216](https://github.com/ClickHouse/ClickHouse/pull/55216) ([Vitaly Baranov](https://github.com/vitlibar)). 
+* Parallel replicas: progress bar [#55574](https://github.com/ClickHouse/ClickHouse/pull/55574) ([Igor Nikonov](https://github.com/devcrafter)). +* Analyzer: Fix result type after IfConstantConditionPass [#55951](https://github.com/ClickHouse/ClickHouse/pull/55951) ([Dmitry Novik](https://github.com/novikd)). +* RemoteSource: remove unnecessary flag [#55980](https://github.com/ClickHouse/ClickHouse/pull/55980) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix `REPLICA_ALREADY_EXISTS` for ReplicatedMergeTree [#56000](https://github.com/ClickHouse/ClickHouse/pull/56000) ([Nikolay Degterinsky](https://github.com/evillique)). +* Rework [#52159](https://github.com/ClickHouse/ClickHouse/issues/52159) to avoid coredump generation [#56039](https://github.com/ClickHouse/ClickHouse/pull/56039) ([Raúl Marín](https://github.com/Algunenano)). +* Bump gRPC to v1.47.5 [#56059](https://github.com/ClickHouse/ClickHouse/pull/56059) ([Robert Schulze](https://github.com/rschu1ze)). +* See what happens if we use less different docker images in integration tests [#56082](https://github.com/ClickHouse/ClickHouse/pull/56082) ([Raúl Marín](https://github.com/Algunenano)). +* Add missing zookeeper retries in StorageReplicatedMergeTree::backupData [#56131](https://github.com/ClickHouse/ClickHouse/pull/56131) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Better process broken parts on table start for replicated tables [#56142](https://github.com/ClickHouse/ClickHouse/pull/56142) ([alesapin](https://github.com/alesapin)). +* Add more details to "Data after merge is not byte-identical to data on another replicas" [#56164](https://github.com/ClickHouse/ClickHouse/pull/56164) ([Azat Khuzhin](https://github.com/azat)). +* Revert "Revert "Fix output/input of Arrow dictionary column"" [#56167](https://github.com/ClickHouse/ClickHouse/pull/56167) ([Kruglov Pavel](https://github.com/Avogar)). +* Add a log message for DatabaseReplicated [#56215](https://github.com/ClickHouse/ClickHouse/pull/56215) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Correct aggregate function cross tab accessors to be endianness-independent. [#56223](https://github.com/ClickHouse/ClickHouse/pull/56223) ([Austin Kothig](https://github.com/kothiga)). +* Fix client suggestions for user without grants [#56234](https://github.com/ClickHouse/ClickHouse/pull/56234) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix link to failed check report in status commit [#56243](https://github.com/ClickHouse/ClickHouse/pull/56243) ([vdimir](https://github.com/vdimir)). +* Analyzer: fix 01019_alter_materialized_view_consistent [#56246](https://github.com/ClickHouse/ClickHouse/pull/56246) ([vdimir](https://github.com/vdimir)). +* Properly process aliases for aggregation-by-partition optimization. [#56254](https://github.com/ClickHouse/ClickHouse/pull/56254) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* deltalake: Do not raise errors when processing add and remove actions [#56260](https://github.com/ClickHouse/ClickHouse/pull/56260) ([joelynch](https://github.com/joelynch)). +* Fix rare logical error in Replicated database [#56272](https://github.com/ClickHouse/ClickHouse/pull/56272) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Update version_date.tsv and changelogs after v23.10.1.1976-stable [#56278](https://github.com/ClickHouse/ClickHouse/pull/56278) ([robot-clickhouse](https://github.com/robot-clickhouse)). 
+* Add assertion that `SizePredictor` is set if `preferred_block_size_bytes` is set [#56302](https://github.com/ClickHouse/ClickHouse/pull/56302) ([Nikita Taranov](https://github.com/nickitat)). +* Implement digest helpers for different objects [#56305](https://github.com/ClickHouse/ClickHouse/pull/56305) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Removed stale events from README [#56311](https://github.com/ClickHouse/ClickHouse/pull/56311) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Fix more tests with analyzer. [#56315](https://github.com/ClickHouse/ClickHouse/pull/56315) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Change some exception codes [#56316](https://github.com/ClickHouse/ClickHouse/pull/56316) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix using table shared id during backup and improve logs. [#56339](https://github.com/ClickHouse/ClickHouse/pull/56339) ([Vitaly Baranov](https://github.com/vitlibar)). +* Print info while decompressing the binary [#56360](https://github.com/ClickHouse/ClickHouse/pull/56360) ([Antonio Andelic](https://github.com/antonio2368)). +* remove unstable test test_heavy_insert_select_check_memory [#56369](https://github.com/ClickHouse/ClickHouse/pull/56369) ([Sema Checherinda](https://github.com/CheSema)). +* Update test_storage_s3_queue/test.py [#56370](https://github.com/ClickHouse/ClickHouse/pull/56370) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update 02735_system_zookeeper_connection.sql [#56374](https://github.com/ClickHouse/ClickHouse/pull/56374) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Cleanup convenience functions in IDataType [#56375](https://github.com/ClickHouse/ClickHouse/pull/56375) ([Robert Schulze](https://github.com/rschu1ze)). +* Update test_storage_s3_queue [#56376](https://github.com/ClickHouse/ClickHouse/pull/56376) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Minor improvements for S3Queue [#56377](https://github.com/ClickHouse/ClickHouse/pull/56377) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Add obsolete setting back [#56382](https://github.com/ClickHouse/ClickHouse/pull/56382) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Rewrite jobs to use callable workflow [#56385](https://github.com/ClickHouse/ClickHouse/pull/56385) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Update stress.py [#56388](https://github.com/ClickHouse/ClickHouse/pull/56388) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix rocksdb with analyzer. [#56391](https://github.com/ClickHouse/ClickHouse/pull/56391) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Option to check particular file with utils/check-style/check-doc-aspell [#56394](https://github.com/ClickHouse/ClickHouse/pull/56394) ([vdimir](https://github.com/vdimir)). +* Add a metric for suspicious parts in ZooKeeper [#56395](https://github.com/ClickHouse/ClickHouse/pull/56395) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix 02404_memory_bound_merging with analyzer. [#56419](https://github.com/ClickHouse/ClickHouse/pull/56419) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* move storage_metadata_write_full_object_key setting to the server scope [#56421](https://github.com/ClickHouse/ClickHouse/pull/56421) ([Sema Checherinda](https://github.com/CheSema)). +* Make autoscaling more responsive [#56422](https://github.com/ClickHouse/ClickHouse/pull/56422) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). 
+* Fix `test_attach_without_fetching` [#56429](https://github.com/ClickHouse/ClickHouse/pull/56429) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Use `pcg` + `randomSeed()` instead of `std::mt19937`/`std::random_device` [#56430](https://github.com/ClickHouse/ClickHouse/pull/56430) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix test `02725_database_hdfs.sh` [#56457](https://github.com/ClickHouse/ClickHouse/pull/56457) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update the AMI receipt [#56459](https://github.com/ClickHouse/ClickHouse/pull/56459) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Make IMergeTreeDataPart::getState() inlinable [#56461](https://github.com/ClickHouse/ClickHouse/pull/56461) ([Alexander Gololobov](https://github.com/davenger)). +* Update version_date.tsv and changelogs after v23.10.2.13-stable [#56467](https://github.com/ClickHouse/ClickHouse/pull/56467) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.9.4.11-stable [#56468](https://github.com/ClickHouse/ClickHouse/pull/56468) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.8.6.16-lts [#56469](https://github.com/ClickHouse/ClickHouse/pull/56469) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.3.16.7-lts [#56470](https://github.com/ClickHouse/ClickHouse/pull/56470) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Disable randomization of allow_experimental_block_number_column flag [#56474](https://github.com/ClickHouse/ClickHouse/pull/56474) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Parallel clone sparse/shallow submodules [#56479](https://github.com/ClickHouse/ClickHouse/pull/56479) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix default port for Replicated database cluster [#56486](https://github.com/ClickHouse/ClickHouse/pull/56486) ([Nikolay Degterinsky](https://github.com/evillique)). +* Updated compression to LZ4 [#56497](https://github.com/ClickHouse/ClickHouse/pull/56497) ([SmitaRKulkarni](https://github.com/SmitaRKulkarni)). +* Analyzer remove unused projection columns [#56499](https://github.com/ClickHouse/ClickHouse/pull/56499) ([Maksim Kita](https://github.com/kitaisreal)). +* FunctionSleep exception message fix [#56500](https://github.com/ClickHouse/ClickHouse/pull/56500) ([Maksim Kita](https://github.com/kitaisreal)). +* Continue rewriting workflows to reusable tests [#56501](https://github.com/ClickHouse/ClickHouse/pull/56501) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Analyzer special functions projection names fix [#56514](https://github.com/ClickHouse/ClickHouse/pull/56514) ([Maksim Kita](https://github.com/kitaisreal)). +* CTE invalid query analysis add test [#56517](https://github.com/ClickHouse/ClickHouse/pull/56517) ([Maksim Kita](https://github.com/kitaisreal)). +* Fix compilation of BackupsWorker.cpp [#56518](https://github.com/ClickHouse/ClickHouse/pull/56518) ([Vitaly Baranov](https://github.com/vitlibar)). +* Analyzer MoveFunctionsOutOfAnyPass refactoring [#56520](https://github.com/ClickHouse/ClickHouse/pull/56520) ([Maksim Kita](https://github.com/kitaisreal)). +* Analyzer support EXPLAIN ESTIMATE [#56522](https://github.com/ClickHouse/ClickHouse/pull/56522) ([Maksim Kita](https://github.com/kitaisreal)). 
+* Analyzer log used row policies [#56531](https://github.com/ClickHouse/ClickHouse/pull/56531) ([Maksim Kita](https://github.com/kitaisreal)). +* Analyzer ORDER BY read in order query plan add test [#56532](https://github.com/ClickHouse/ClickHouse/pull/56532) ([Maksim Kita](https://github.com/kitaisreal)). +* ReplicatedMergeTree: check shutdown flags in retry loops [#56533](https://github.com/ClickHouse/ClickHouse/pull/56533) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix race between REPLACE_RANGE and GET_PART (set actual part name when fetching) [#56536](https://github.com/ClickHouse/ClickHouse/pull/56536) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Bump gRPC to v1.54.3 [#56543](https://github.com/ClickHouse/ClickHouse/pull/56543) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix flaky LDAP integration tests [#56544](https://github.com/ClickHouse/ClickHouse/pull/56544) ([Julian Maicher](https://github.com/jmaicher)). +* Remove useless using [#56546](https://github.com/ClickHouse/ClickHouse/pull/56546) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Better warning message [#56547](https://github.com/ClickHouse/ClickHouse/pull/56547) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Allow `chassert` to guide the static analyzer [#56552](https://github.com/ClickHouse/ClickHouse/pull/56552) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove C++ templates [#56556](https://github.com/ClickHouse/ClickHouse/pull/56556) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix `test_keeper_four_word_command/test.py::test_cmd_crst` [#56570](https://github.com/ClickHouse/ClickHouse/pull/56570) ([Antonio Andelic](https://github.com/antonio2368)). +* Delete unnecessary file from tests [#56572](https://github.com/ClickHouse/ClickHouse/pull/56572) ([vdimir](https://github.com/vdimir)). +* Analyzer: fix logical error with set in array join [#56587](https://github.com/ClickHouse/ClickHouse/pull/56587) ([vdimir](https://github.com/vdimir)). +* hide VERSION_INLINE_DATA under feature flag [#56594](https://github.com/ClickHouse/ClickHouse/pull/56594) ([Sema Checherinda](https://github.com/CheSema)). +* Fix 02554_fix_grouping_sets_predicate_push_down with analyzer. [#56595](https://github.com/ClickHouse/ClickHouse/pull/56595) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Add "FunctionSleep exception message fix" again [#56597](https://github.com/ClickHouse/ClickHouse/pull/56597) ([Raúl Marín](https://github.com/Algunenano)). +* Update version_date.tsv and changelogs after v23.10.3.5-stable [#56606](https://github.com/ClickHouse/ClickHouse/pull/56606) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Remove bad test [#56612](https://github.com/ClickHouse/ClickHouse/pull/56612) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Symbolize `trace_log` for exporting [#56613](https://github.com/ClickHouse/ClickHouse/pull/56613) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add indices to exported system logs [#56615](https://github.com/ClickHouse/ClickHouse/pull/56615) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove dependencies [#56616](https://github.com/ClickHouse/ClickHouse/pull/56616) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* WIP: Add test describing MV deduplication issues [#56621](https://github.com/ClickHouse/ClickHouse/pull/56621) ([Jordi Villar](https://github.com/jrdi)). 
+* Add test for ROW POLICY ON CLUSTER [#56623](https://github.com/ClickHouse/ClickHouse/pull/56623) ([Nikolay Degterinsky](https://github.com/evillique)). +* Enable --secure flag for clickhouse-client for hostnames pointing to clickhouse cloud [#56638](https://github.com/ClickHouse/ClickHouse/pull/56638) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Continue with work from [#56621](https://github.com/ClickHouse/ClickHouse/issues/56621) [#56641](https://github.com/ClickHouse/ClickHouse/pull/56641) ([Jordi Villar](https://github.com/jrdi)). +* Switch to SSL port for clickhouse-client for hostnames pointing to clickhouse cloud [#56649](https://github.com/ClickHouse/ClickHouse/pull/56649) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Remove garbage from libssh [#56654](https://github.com/ClickHouse/ClickHouse/pull/56654) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Delete a file [#56655](https://github.com/ClickHouse/ClickHouse/pull/56655) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Delete a file (2) [#56656](https://github.com/ClickHouse/ClickHouse/pull/56656) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove some entries from `analyzer_tech_debt.txt` [#56658](https://github.com/ClickHouse/ClickHouse/pull/56658) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Miscellaneous [#56662](https://github.com/ClickHouse/ClickHouse/pull/56662) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Bump gRPC to v1.55.4 and protobuf to v22.5 [#56664](https://github.com/ClickHouse/ClickHouse/pull/56664) ([Robert Schulze](https://github.com/rschu1ze)). +* Small refactoring of AST hash calculation (follow-up to [#56545](https://github.com/ClickHouse/ClickHouse/issues/56545)) [#56665](https://github.com/ClickHouse/ClickHouse/pull/56665) ([Robert Schulze](https://github.com/rschu1ze)). +* Analyzer: filtering by virtual columns for StorageS3 [#56668](https://github.com/ClickHouse/ClickHouse/pull/56668) ([vdimir](https://github.com/vdimir)). +* Add back flaky tests to analyzer_tech_debt.txt [#56669](https://github.com/ClickHouse/ClickHouse/pull/56669) ([Raúl Marín](https://github.com/Algunenano)). +* gRPC: remove build dependency on systemd [#56671](https://github.com/ClickHouse/ClickHouse/pull/56671) ([Raúl Marín](https://github.com/Algunenano)). +* Remove unused code [#56677](https://github.com/ClickHouse/ClickHouse/pull/56677) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix missing argument for style_check.py in master workflow [#56691](https://github.com/ClickHouse/ClickHouse/pull/56691) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fix unexpected parts handling [#56693](https://github.com/ClickHouse/ClickHouse/pull/56693) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Revert "Revert "Add a setting max_execution_time_leaf to limit the execution time on shard for distributed query"" [#56707](https://github.com/ClickHouse/ClickHouse/pull/56707) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix use_structure_from_insertion_table_in_table_functions with new Analyzer [#56708](https://github.com/ClickHouse/ClickHouse/pull/56708) ([Kruglov Pavel](https://github.com/Avogar)). +* Disable settings randomisation for `02896_memory_accounting_for_user.sh` [#56709](https://github.com/ClickHouse/ClickHouse/pull/56709) ([Nikita Taranov](https://github.com/nickitat)). 
+* Light autogenerated file [#56720](https://github.com/ClickHouse/ClickHouse/pull/56720) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Less CMake checks [#56721](https://github.com/ClickHouse/ClickHouse/pull/56721) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove orphan header files [#56722](https://github.com/ClickHouse/ClickHouse/pull/56722) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Try to fix hang in 01104_distributed_numbers_test [#56764](https://github.com/ClickHouse/ClickHouse/pull/56764) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Test RabbitMQ with secure connection [#56767](https://github.com/ClickHouse/ClickHouse/pull/56767) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix flaky test_replicated_merge_tree_encryption_codec. [#56768](https://github.com/ClickHouse/ClickHouse/pull/56768) ([Vitaly Baranov](https://github.com/vitlibar)). +* fix typo in ClickHouseDictionarySource [#56776](https://github.com/ClickHouse/ClickHouse/pull/56776) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Fix pygithub [#56778](https://github.com/ClickHouse/ClickHouse/pull/56778) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Add test for avoided recursion [#56785](https://github.com/ClickHouse/ClickHouse/pull/56785) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fix randomization of Keeper configs in stress tests [#56788](https://github.com/ClickHouse/ClickHouse/pull/56788) ([Antonio Andelic](https://github.com/antonio2368)). +* Try fix `No user in current context, it's a bug` [#56789](https://github.com/ClickHouse/ClickHouse/pull/56789) ([Antonio Andelic](https://github.com/antonio2368)). +* Update avg_weighted.xml [#56797](https://github.com/ClickHouse/ClickHouse/pull/56797) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Better except for SSL authentication failure [#56811](https://github.com/ClickHouse/ClickHouse/pull/56811) ([Nikolay Degterinsky](https://github.com/evillique)). +* More stable `test_keeper_reconfig_replace_leader` [#56835](https://github.com/ClickHouse/ClickHouse/pull/56835) ([Antonio Andelic](https://github.com/antonio2368)). +* Add cancellation hook for moving background operation [#56846](https://github.com/ClickHouse/ClickHouse/pull/56846) ([Aleksei Filatov](https://github.com/aalexfvk)). +* Updated comment in universal.sh [#56852](https://github.com/ClickHouse/ClickHouse/pull/56852) ([Robert Schulze](https://github.com/rschu1ze)). +* Bump gRPC to v1.59 and protobuf to v24.4 [#56853](https://github.com/ClickHouse/ClickHouse/pull/56853) ([Robert Schulze](https://github.com/rschu1ze)). +* Better exception messages [#56854](https://github.com/ClickHouse/ClickHouse/pull/56854) ([Antonio Andelic](https://github.com/antonio2368)). +* Sparse checkout: Use `--remote` for `git submodule update` [#56857](https://github.com/ClickHouse/ClickHouse/pull/56857) ([Aleksandr Musorin](https://github.com/AVMusorin)). +* Fix `test_keeper_broken_logs` [#56858](https://github.com/ClickHouse/ClickHouse/pull/56858) ([Antonio Andelic](https://github.com/antonio2368)). +* CMake: Small cleanup in cpu_features.cmake [#56861](https://github.com/ClickHouse/ClickHouse/pull/56861) ([Robert Schulze](https://github.com/rschu1ze)). +* Planner support transactions [#56867](https://github.com/ClickHouse/ClickHouse/pull/56867) ([Maksim Kita](https://github.com/kitaisreal)). 
+* Improve diagnostics in test 02908_many_requests_to_system_replicas [#56869](https://github.com/ClickHouse/ClickHouse/pull/56869) ([Alexander Gololobov](https://github.com/davenger)). +* Update 01052_window_view_proc_tumble_to_now.sh [#56870](https://github.com/ClickHouse/ClickHouse/pull/56870) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Call cache check a bit more often [#56872](https://github.com/ClickHouse/ClickHouse/pull/56872) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update test_storage_s3_queue/test.py [#56874](https://github.com/ClickHouse/ClickHouse/pull/56874) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix perf tests report when there are no tests [#56881](https://github.com/ClickHouse/ClickHouse/pull/56881) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Remove ctest [#56894](https://github.com/ClickHouse/ClickHouse/pull/56894) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Simpler CMake [#56898](https://github.com/ClickHouse/ClickHouse/pull/56898) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* test for [#56790](https://github.com/ClickHouse/ClickHouse/issues/56790) [#56899](https://github.com/ClickHouse/ClickHouse/pull/56899) ([Denny Crane](https://github.com/den-crane)). +* Allow delegate disk to handle retries for createDirectories [#56905](https://github.com/ClickHouse/ClickHouse/pull/56905) ([Alexander Gololobov](https://github.com/davenger)). +* Update version_date.tsv and changelogs after v23.10.4.25-stable [#56906](https://github.com/ClickHouse/ClickHouse/pull/56906) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.3.17.13-lts [#56907](https://github.com/ClickHouse/ClickHouse/pull/56907) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.8.7.24-lts [#56908](https://github.com/ClickHouse/ClickHouse/pull/56908) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.9.5.29-stable [#56909](https://github.com/ClickHouse/ClickHouse/pull/56909) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Remove outdated instructions [#56911](https://github.com/ClickHouse/ClickHouse/pull/56911) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Avoid dependencies with no fixed versions [#56914](https://github.com/ClickHouse/ClickHouse/pull/56914) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix race on zk_log initialization [#56915](https://github.com/ClickHouse/ClickHouse/pull/56915) ([Alexander Gololobov](https://github.com/davenger)). +* Check what will happen if I remove some lines [#56916](https://github.com/ClickHouse/ClickHouse/pull/56916) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Update fasttest [#56919](https://github.com/ClickHouse/ClickHouse/pull/56919) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Make some tests independent of macro settings [#56927](https://github.com/ClickHouse/ClickHouse/pull/56927) ([Raúl Marín](https://github.com/Algunenano)). +* Fix flaky 02494_query_cache_events [#56935](https://github.com/ClickHouse/ClickHouse/pull/56935) ([Robert Schulze](https://github.com/rschu1ze)). +* Add CachedReadBufferReadFromCache{Hits,Misses} profile events [#56936](https://github.com/ClickHouse/ClickHouse/pull/56936) ([Jordi Villar](https://github.com/jrdi)). 
+* Send fatal logs by default in clickhouse-local [#56956](https://github.com/ClickHouse/ClickHouse/pull/56956) ([Nikolay Degterinsky](https://github.com/evillique)). +* Resubmit: Better except for SSL authentication [#56957](https://github.com/ClickHouse/ClickHouse/pull/56957) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix `test_keeper_auth` [#56960](https://github.com/ClickHouse/ClickHouse/pull/56960) ([Antonio Andelic](https://github.com/antonio2368)). +* Fewer concurrent requests in 02908_many_requests_to_system_replicas [#56968](https://github.com/ClickHouse/ClickHouse/pull/56968) ([Alexander Gololobov](https://github.com/davenger)). +* Own CMake for GRPC [#56971](https://github.com/ClickHouse/ClickHouse/pull/56971) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix build in Backups/BackupIO_S3.cpp [#56974](https://github.com/ClickHouse/ClickHouse/pull/56974) ([Robert Schulze](https://github.com/rschu1ze)). +* Add exclude for tryBase64Decode to backward compat test (follow-up to [#56913](https://github.com/ClickHouse/ClickHouse/issues/56913)) [#56975](https://github.com/ClickHouse/ClickHouse/pull/56975) ([Robert Schulze](https://github.com/rschu1ze)). +* Prefer sccache to ccache by default [#56980](https://github.com/ClickHouse/ClickHouse/pull/56980) ([Igor Nikonov](https://github.com/devcrafter)). +* update 02003_memory_limit_in_client.sh [#56981](https://github.com/ClickHouse/ClickHouse/pull/56981) ([Bharat Nallan](https://github.com/bharatnc)). +* Make check for the limited cmake dependencies the part of sparse checkout [#56991](https://github.com/ClickHouse/ClickHouse/pull/56991) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fix flaky and slow tests. [#56993](https://github.com/ClickHouse/ClickHouse/pull/56993) ([Amos Bird](https://github.com/amosbird)). +* Fix dropping tables in test_create_or_drop_tables_during_backup [#57007](https://github.com/ClickHouse/ClickHouse/pull/57007) ([Vitaly Baranov](https://github.com/vitlibar)). +* Enable Analyzer in Stress and Fuzz tests [#57008](https://github.com/ClickHouse/ClickHouse/pull/57008) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Run CI for PRs with missing documentation [#57018](https://github.com/ClickHouse/ClickHouse/pull/57018) ([Michael Kolupaev](https://github.com/al13n321)). +* test_s3_engine_heavy_write_check_mem: turn test off [#57025](https://github.com/ClickHouse/ClickHouse/pull/57025) ([Sema Checherinda](https://github.com/CheSema)). +* NamedCollections: make exception message more informative. [#57031](https://github.com/ClickHouse/ClickHouse/pull/57031) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Avoid returning biggest resolution when fpr > 0.283 [#57034](https://github.com/ClickHouse/ClickHouse/pull/57034) ([Jordi Villar](https://github.com/jrdi)). +* Fix: suppress TSAN in RabbitMQ test [#57040](https://github.com/ClickHouse/ClickHouse/pull/57040) ([Igor Nikonov](https://github.com/devcrafter)). +* Small Keeper fixes [#57047](https://github.com/ClickHouse/ClickHouse/pull/57047) ([Antonio Andelic](https://github.com/antonio2368)). +* Parallel replicas: cleanup, narrow dependency [#57054](https://github.com/ClickHouse/ClickHouse/pull/57054) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix gRPC build on macOS [#57061](https://github.com/ClickHouse/ClickHouse/pull/57061) ([Robert Schulze](https://github.com/rschu1ze)). 
+* Better comment for ITransformingStep::transformPipeline [#57062](https://github.com/ClickHouse/ClickHouse/pull/57062) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix `Duplicate set` for StorageSet with analyzer. [#57063](https://github.com/ClickHouse/ClickHouse/pull/57063) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Better metadata path [#57083](https://github.com/ClickHouse/ClickHouse/pull/57083) ([Nikolay Degterinsky](https://github.com/evillique)). +* Analyzer fuzzer 3 (aggregate_functions_null_for_empty for projections) [#57099](https://github.com/ClickHouse/ClickHouse/pull/57099) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Update numbers.md [#57100](https://github.com/ClickHouse/ClickHouse/pull/57100) ([konruvikt](https://github.com/konruvikt)). +* Fix FunctionNode::toASTImpl [#57102](https://github.com/ClickHouse/ClickHouse/pull/57102) ([vdimir](https://github.com/vdimir)). +* Analyzer fuzzer 5 [#57103](https://github.com/ClickHouse/ClickHouse/pull/57103) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Cancel PipelineExecutor properly in case of exception in spawnThreads [#57104](https://github.com/ClickHouse/ClickHouse/pull/57104) ([Kruglov Pavel](https://github.com/Avogar)). +* Allow HashedDictionary/FunctionsConversion as large TU [#57108](https://github.com/ClickHouse/ClickHouse/pull/57108) ([Azat Khuzhin](https://github.com/azat)). +* Disable checksums for builds with fuzzer [#57122](https://github.com/ClickHouse/ClickHouse/pull/57122) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Analyzer: Fix logical error in LogicalExpressionOptimizerVisitor [#57123](https://github.com/ClickHouse/ClickHouse/pull/57123) ([vdimir](https://github.com/vdimir)). +* Split HashedDictionary CU [#57124](https://github.com/ClickHouse/ClickHouse/pull/57124) ([Azat Khuzhin](https://github.com/azat)). +* Cancel executor in ~CreatingSetsTransform [#57125](https://github.com/ClickHouse/ClickHouse/pull/57125) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix system.*_log in artifacts on CI [#57128](https://github.com/ClickHouse/ClickHouse/pull/57128) ([Azat Khuzhin](https://github.com/azat)). +* Fix something in ReplicatedMergeTree [#57129](https://github.com/ClickHouse/ClickHouse/pull/57129) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Do not symbolize traces for debug/sanitizer builds for sending to cloud [#57130](https://github.com/ClickHouse/ClickHouse/pull/57130) ([Azat Khuzhin](https://github.com/azat)). +* Resubmit 01600_parts_types_metrics test (possibly without flakiness) [#57131](https://github.com/ClickHouse/ClickHouse/pull/57131) ([Azat Khuzhin](https://github.com/azat)). +* Follow up to [#56541](https://github.com/ClickHouse/ClickHouse/issues/56541) [#57141](https://github.com/ClickHouse/ClickHouse/pull/57141) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Allow to disable reorder-functions-after-sorting optimization [#57144](https://github.com/ClickHouse/ClickHouse/pull/57144) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix bad test `00002_log_and_exception_messages_formatting` [#57145](https://github.com/ClickHouse/ClickHouse/pull/57145) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix test test_replicated_merge_tree_encryption_codec/test.py::test_different_keys [#57146](https://github.com/ClickHouse/ClickHouse/pull/57146) ([Vitaly Baranov](https://github.com/vitlibar)). 
+* Remove partial results from build matrix for stress tests [#57150](https://github.com/ClickHouse/ClickHouse/pull/57150) ([Azat Khuzhin](https://github.com/azat)). +* Minor changes in test_check_table [#57154](https://github.com/ClickHouse/ClickHouse/pull/57154) ([vdimir](https://github.com/vdimir)). +* Fix 02903_rmt_retriable_merge_exception flakiness for replicated database [#57155](https://github.com/ClickHouse/ClickHouse/pull/57155) ([Azat Khuzhin](https://github.com/azat)). +* Mark select() as harmful function [#57156](https://github.com/ClickHouse/ClickHouse/pull/57156) ([Igor Nikonov](https://github.com/devcrafter)). +* Improve the cherry-pick PR description [#57167](https://github.com/ClickHouse/ClickHouse/pull/57167) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Add debugging info for 01600_parts_types_metrics on failures [#57170](https://github.com/ClickHouse/ClickHouse/pull/57170) ([Azat Khuzhin](https://github.com/azat)). +* Tiny improvement security [#57171](https://github.com/ClickHouse/ClickHouse/pull/57171) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Update blob_storage_log.md [#57187](https://github.com/ClickHouse/ClickHouse/pull/57187) ([vdimir](https://github.com/vdimir)). +* [RFC] Set log_comment to the file name while processing files in client [#57191](https://github.com/ClickHouse/ClickHouse/pull/57191) ([Azat Khuzhin](https://github.com/azat)). +* Add test for [#5323](https://github.com/ClickHouse/ClickHouse/issues/5323) [#57192](https://github.com/ClickHouse/ClickHouse/pull/57192) ([Raúl Marín](https://github.com/Algunenano)). +* Analyzer fuzzer 6 (arrayJoin) [#57198](https://github.com/ClickHouse/ClickHouse/pull/57198) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Add test for [#47366](https://github.com/ClickHouse/ClickHouse/issues/47366) [#57200](https://github.com/ClickHouse/ClickHouse/pull/57200) ([Raúl Marín](https://github.com/Algunenano)). +* Add test for [#51321](https://github.com/ClickHouse/ClickHouse/issues/51321) [#57202](https://github.com/ClickHouse/ClickHouse/pull/57202) ([Raúl Marín](https://github.com/Algunenano)). +* Fix possible crash (in Rust) of fuzzy finder in client [#57204](https://github.com/ClickHouse/ClickHouse/pull/57204) ([Azat Khuzhin](https://github.com/azat)). +* fix zero-copy locks leaking [#57205](https://github.com/ClickHouse/ClickHouse/pull/57205) ([Sema Checherinda](https://github.com/CheSema)). +* Fix test_distributed_storage_configuration flakiness [#57206](https://github.com/ClickHouse/ClickHouse/pull/57206) ([Azat Khuzhin](https://github.com/azat)). +* Update Sentry [#57222](https://github.com/ClickHouse/ClickHouse/pull/57222) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Update version_date.tsv and changelogs after v23.10.5.20-stable [#57223](https://github.com/ClickHouse/ClickHouse/pull/57223) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.9.6.20-stable [#57224](https://github.com/ClickHouse/ClickHouse/pull/57224) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.3.18.15-lts [#57225](https://github.com/ClickHouse/ClickHouse/pull/57225) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Update version_date.tsv and changelogs after v23.8.8.20-lts [#57226](https://github.com/ClickHouse/ClickHouse/pull/57226) ([robot-clickhouse](https://github.com/robot-clickhouse)). 
+* Change cursor style for overwrite mode (INS) to blinking in client [#57227](https://github.com/ClickHouse/ClickHouse/pull/57227) ([Azat Khuzhin](https://github.com/azat)). +* Remove test `01280_ttl_where_group_by` [#57230](https://github.com/ClickHouse/ClickHouse/pull/57230) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix docs [#57234](https://github.com/ClickHouse/ClickHouse/pull/57234) ([Nikolay Degterinsky](https://github.com/evillique)). +* Remove addBatchSinglePlaceFromInterval [#57258](https://github.com/ClickHouse/ClickHouse/pull/57258) ([Raúl Marín](https://github.com/Algunenano)). +* Add some additional groups to CI [#57260](https://github.com/ClickHouse/ClickHouse/pull/57260) ([alesapin](https://github.com/alesapin)). +* Analyzer: fix result type of aggregate function with NULL [#57265](https://github.com/ClickHouse/ClickHouse/pull/57265) ([vdimir](https://github.com/vdimir)). +* Ignore memory exception in Keeper asio workers [#57268](https://github.com/ClickHouse/ClickHouse/pull/57268) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix code reports [#57301](https://github.com/ClickHouse/ClickHouse/pull/57301) ([Raúl Marín](https://github.com/Algunenano)). +* Follow up recommendations from [#57167](https://github.com/ClickHouse/ClickHouse/issues/57167) [#57302](https://github.com/ClickHouse/ClickHouse/pull/57302) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Add back flaky tests to analyzer_tech_debt.txt [#57307](https://github.com/ClickHouse/ClickHouse/pull/57307) ([Raúl Marín](https://github.com/Algunenano)). +* Lower level for annoying S3 log [#57312](https://github.com/ClickHouse/ClickHouse/pull/57312) ([Antonio Andelic](https://github.com/antonio2368)). +* Add regression test for skim (Rust) crash on pasting certain input [#57313](https://github.com/ClickHouse/ClickHouse/pull/57313) ([Azat Khuzhin](https://github.com/azat)). +* Remove unused Strings from MergeTreeData [#57318](https://github.com/ClickHouse/ClickHouse/pull/57318) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Address 02668_ulid_decoding flakiness [#57320](https://github.com/ClickHouse/ClickHouse/pull/57320) ([Raúl Marín](https://github.com/Algunenano)). +* DiskWeb fix [#57322](https://github.com/ClickHouse/ClickHouse/pull/57322) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update README.md [#57325](https://github.com/ClickHouse/ClickHouse/pull/57325) ([Tyler Hannan](https://github.com/tylerhannan)). +* Add information about new _size virtual column in file/s3/url/hdfs/azure table functions [#57328](https://github.com/ClickHouse/ClickHouse/pull/57328) ([Kruglov Pavel](https://github.com/Avogar)). +* Follow-up to [#56490](https://github.com/ClickHouse/ClickHouse/issues/56490): Fix build with `cmake -DENABLE_LIBRARIES=0` [#57330](https://github.com/ClickHouse/ClickHouse/pull/57330) ([Robert Schulze](https://github.com/rschu1ze)). +* Mark a setting obsolete [#57336](https://github.com/ClickHouse/ClickHouse/pull/57336) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Always renew ZK client in `WithRetries` [#57357](https://github.com/ClickHouse/ClickHouse/pull/57357) ([Antonio Andelic](https://github.com/antonio2368)). +* Shutdown disks after tables [#57358](https://github.com/ClickHouse/ClickHouse/pull/57358) ([Alexander Gololobov](https://github.com/davenger)). +* Update DDLTask.cpp [#57369](https://github.com/ClickHouse/ClickHouse/pull/57369) ([Alexander Tokmakov](https://github.com/tavplubix)). 
+* verbose exception messages for StorageFuzzJSON [#57372](https://github.com/ClickHouse/ClickHouse/pull/57372) ([Julia Kartseva](https://github.com/jkartseva)). +* Initialize only required disks in clickhouse-disks [#57387](https://github.com/ClickHouse/ClickHouse/pull/57387) ([Nikolay Degterinsky](https://github.com/evillique)). +* Allow wildcards in directories for partitioned write with File storage [#57391](https://github.com/ClickHouse/ClickHouse/pull/57391) ([Nikolay Degterinsky](https://github.com/evillique)). +* Add tests for 43202 [#57404](https://github.com/ClickHouse/ClickHouse/pull/57404) ([Raúl Marín](https://github.com/Algunenano)). +* Consider whole check failure in bugfix validate check as an error [#57413](https://github.com/ClickHouse/ClickHouse/pull/57413) ([vdimir](https://github.com/vdimir)). +* Change type of s3_cache in test_encrypted_disk [#57416](https://github.com/ClickHouse/ClickHouse/pull/57416) ([vdimir](https://github.com/vdimir)). +* Add extra debug information on replication consistency errors [#57419](https://github.com/ClickHouse/ClickHouse/pull/57419) ([Raúl Marín](https://github.com/Algunenano)). +* Don't print server revision in client on connect [#57435](https://github.com/ClickHouse/ClickHouse/pull/57435) ([Nikita Taranov](https://github.com/nickitat)). +* Adding Sydney Meetup [#57457](https://github.com/ClickHouse/ClickHouse/pull/57457) ([Tyler Hannan](https://github.com/tylerhannan)). +* Fix adjusting log_comment in case of multiple files passed [#57464](https://github.com/ClickHouse/ClickHouse/pull/57464) ([Azat Khuzhin](https://github.com/azat)). +* Fix flaky test 02697_stop_reading_on_first_cancel.sh [#57481](https://github.com/ClickHouse/ClickHouse/pull/57481) ([Raúl Marín](https://github.com/Algunenano)). +* Tiny refactoring around cache [#57482](https://github.com/ClickHouse/ClickHouse/pull/57482) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Decrease default value for `filesystem_prefetch_min_bytes_for_single_read_task` [#57489](https://github.com/ClickHouse/ClickHouse/pull/57489) ([Nikita Taranov](https://github.com/nickitat)). +* Remove bad test [#57494](https://github.com/ClickHouse/ClickHouse/pull/57494) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add changelog for 23.11 [#57517](https://github.com/ClickHouse/ClickHouse/pull/57517) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Simple cleanup in distributed (while dealing with parallel replicas) [#57518](https://github.com/ClickHouse/ClickHouse/pull/57518) ([Igor Nikonov](https://github.com/devcrafter)). +* Remove a feature. [#57521](https://github.com/ClickHouse/ClickHouse/pull/57521) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* `S3Queue` is production ready [#57548](https://github.com/ClickHouse/ClickHouse/pull/57548) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Revert "Merge pull request [#56724](https://github.com/ClickHouse/ClickHouse/issues/56724) from canhld94/ch_replicated_column_mismatch" [#57576](https://github.com/ClickHouse/ClickHouse/pull/57576) ([Alexey Milovidov](https://github.com/alexey-milovidov)). 
+ diff --git a/docs/changelogs/v23.11.2.11-stable.md b/docs/changelogs/v23.11.2.11-stable.md new file mode 100644 index 00000000000..490cc9a4590 --- /dev/null +++ b/docs/changelogs/v23.11.2.11-stable.md @@ -0,0 +1,22 @@ +--- +sidebar_position: 1 +sidebar_label: 2023 +--- + +# 2023 Changelog + +### ClickHouse release v23.11.2.11-stable (6e5411358c8) FIXME as compared to v23.11.1.2711-stable (05bc8ef1e02) + +#### Improvement +* Backported in [#57661](https://github.com/ClickHouse/ClickHouse/issues/57661): Handle sigabrt case when getting PostgreSQl table structure with empty array. [#57618](https://github.com/ClickHouse/ClickHouse/pull/57618) ([Mike Kot (Михаил Кот)](https://github.com/myrrc)). + +#### Bug Fix (user-visible misbehavior in an official stable release) + +* Ignore ON CLUSTER clause in grant/revoke queries for management of replicated access entities. [#57538](https://github.com/ClickHouse/ClickHouse/pull/57538) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* Fix SIGSEGV for aggregation of sparse columns with any() RESPECT NULL [#57710](https://github.com/ClickHouse/ClickHouse/pull/57710) ([Azat Khuzhin](https://github.com/azat)). +* Fix bug window functions: revert [#39631](https://github.com/ClickHouse/ClickHouse/issues/39631) [#57766](https://github.com/ClickHouse/ClickHouse/pull/57766) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### NOT FOR CHANGELOG / INSIGNIFICANT + +* Pin alpine version of integration tests helper container [#57669](https://github.com/ClickHouse/ClickHouse/pull/57669) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). + diff --git a/docs/changelogs/v23.11.3.23-stable.md b/docs/changelogs/v23.11.3.23-stable.md new file mode 100644 index 00000000000..7fcc65beb54 --- /dev/null +++ b/docs/changelogs/v23.11.3.23-stable.md @@ -0,0 +1,26 @@ +--- +sidebar_position: 1 +sidebar_label: 2023 +--- + +# 2023 Changelog + +### ClickHouse release v23.11.3.23-stable (a14ab450b0e) FIXME as compared to v23.11.2.11-stable (6e5411358c8) + +#### Bug Fix (user-visible misbehavior in an official stable release) + +* Fix invalid memory access in BLAKE3 (Rust) [#57876](https://github.com/ClickHouse/ClickHouse/pull/57876) ([Raúl Marín](https://github.com/Algunenano)). +* Normalize function names in CREATE INDEX [#57906](https://github.com/ClickHouse/ClickHouse/pull/57906) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix handling of unavailable replicas before first request happened [#57933](https://github.com/ClickHouse/ClickHouse/pull/57933) ([Nikita Taranov](https://github.com/nickitat)). +* Revert "Fix bug window functions: revert [#39631](https://github.com/ClickHouse/ClickHouse/issues/39631)" [#58031](https://github.com/ClickHouse/ClickHouse/pull/58031) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). + +#### NO CL CATEGORY + +* Backported in [#57918](https://github.com/ClickHouse/ClickHouse/issues/57918):. [#57909](https://github.com/ClickHouse/ClickHouse/pull/57909) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### NOT FOR CHANGELOG / INSIGNIFICANT + +* Remove heavy rust stable toolchain [#57905](https://github.com/ClickHouse/ClickHouse/pull/57905) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fix docker image for integration tests (fixes CI) [#57952](https://github.com/ClickHouse/ClickHouse/pull/57952) ([Azat Khuzhin](https://github.com/azat)). 
+* Always use `pread` for reading cache segments [#57970](https://github.com/ClickHouse/ClickHouse/pull/57970) ([Nikita Taranov](https://github.com/nickitat)). + diff --git a/docs/changelogs/v23.12.1.1368-stable.md b/docs/changelogs/v23.12.1.1368-stable.md new file mode 100644 index 00000000000..1a322ae9c0f --- /dev/null +++ b/docs/changelogs/v23.12.1.1368-stable.md @@ -0,0 +1,327 @@ +--- +sidebar_position: 1 +sidebar_label: 2023 +--- + +# 2023 Changelog + +### ClickHouse release v23.12.1.1368-stable (a2faa65b080) FIXME as compared to v23.11.1.2711-stable (05bc8ef1e02) + +#### Backward Incompatible Change +* Fix check for non-deterministic functions in TTL expressions. Previously, you could create a TTL expression with non-deterministic functions in some cases, which could lead to undefined behavior later. This fixes [#37250](https://github.com/ClickHouse/ClickHouse/issues/37250). Disallow TTL expressions that don't depend on any columns of a table by default. It can be allowed back by `SET allow_suspicious_ttl_expressions = 1` or `SET compatibility = '23.11'`. Closes [#37286](https://github.com/ClickHouse/ClickHouse/issues/37286). [#51858](https://github.com/ClickHouse/ClickHouse/pull/51858) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove function `arrayFold` because it has a bug. This closes [#57816](https://github.com/ClickHouse/ClickHouse/issues/57816). This closes [#57458](https://github.com/ClickHouse/ClickHouse/issues/57458). [#57836](https://github.com/ClickHouse/ClickHouse/pull/57836) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove the feature of `is_deleted` row in ReplacingMergeTree and the `CLEANUP` modifier for the OPTIMIZE query. This fixes [#57930](https://github.com/ClickHouse/ClickHouse/issues/57930). This closes [#54988](https://github.com/ClickHouse/ClickHouse/issues/54988). This closes [#54570](https://github.com/ClickHouse/ClickHouse/issues/54570). This closes [#50346](https://github.com/ClickHouse/ClickHouse/issues/50346). This closes [#47579](https://github.com/ClickHouse/ClickHouse/issues/47579). The feature has to be removed because it is not good. We have to remove it as quickly as possible, because there is no other option. [#57932](https://github.com/ClickHouse/ClickHouse/pull/57932) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* The MergeTree setting `clean_deleted_rows` is deprecated, it has no effect anymore. The `CLEANUP` keyword for `OPTIMIZE` is not allowed by default (unless `allow_experimental_replacing_merge_with_cleanup` is enabled). [#58267](https://github.com/ClickHouse/ClickHouse/pull/58267) ([Alexander Tokmakov](https://github.com/tavplubix)). + +#### New Feature +* Allow disabling of HEAD request before GET request. [#54602](https://github.com/ClickHouse/ClickHouse/pull/54602) ([Fionera](https://github.com/fionera)). +* Add a HTTP endpoint for checking if Keeper is ready to accept traffic. [#55876](https://github.com/ClickHouse/ClickHouse/pull/55876) ([Konstantin Bogdanov](https://github.com/thevar1able)). +* Add 'union' mode for schema inference. In this mode the resulting table schema is the union of all files schemas (so schema is inferred from each file). The mode of schema inference is controlled by a setting `schema_inference_mode` with 2 possible values - `default` and `union`. Closes [#55428](https://github.com/ClickHouse/ClickHouse/issues/55428). [#55892](https://github.com/ClickHouse/ClickHouse/pull/55892) ([Kruglov Pavel](https://github.com/Avogar)). 
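A brief sketch of the new `schema_inference_mode` setting described in the last entry above; the file names and columns are hypothetical and only illustrate the behaviour the entry claims:

```sql
-- Suppose data_1.parquet contains column (a) and data_2.parquet contains column (b).
-- With the default mode the schema is inferred from the first file only;
-- with 'union' the resulting schema is the union of both files' schemas: (a, b).
SET schema_inference_mode = 'union';
DESCRIBE TABLE file('data_*.parquet');
```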
+* Add new setting `input_format_csv_try_infer_numbers_from_strings` that allows inferring numbers from strings in CSV format. Closes [#56455](https://github.com/ClickHouse/ClickHouse/issues/56455). [#56859](https://github.com/ClickHouse/ClickHouse/pull/56859) ([Kruglov Pavel](https://github.com/Avogar)).
+* Refreshable materialized views. [#56946](https://github.com/ClickHouse/ClickHouse/pull/56946) ([Michael Kolupaev](https://github.com/al13n321)).
+* Add more warnings on the number of databases and tables. [#57375](https://github.com/ClickHouse/ClickHouse/pull/57375) ([凌涛](https://github.com/lingtaolf)).
+* Added a new mutation command `ALTER TABLE <table> APPLY DELETED MASK`, which allows enforcing the application of the mask written by lightweight delete and removing rows marked as deleted from disk. [#57433](https://github.com/ClickHouse/ClickHouse/pull/57433) ([Anton Popov](https://github.com/CurtizJ)).
+* Added a new SQL function `sqid` to generate Sqids (https://sqids.org/), example: `SELECT sqid(125, 126)`. [#57512](https://github.com/ClickHouse/ClickHouse/pull/57512) ([Robert Schulze](https://github.com/rschu1ze)).
+* Dictionary with `HASHED_ARRAY` (and `COMPLEX_KEY_HASHED_ARRAY`) layout supports `SHARDS` similarly to `HASHED`. [#57544](https://github.com/ClickHouse/ClickHouse/pull/57544) ([vdimir](https://github.com/vdimir)).
+* Add asynchronous metrics for total primary key bytes and total allocated primary key bytes in memory. [#57551](https://github.com/ClickHouse/ClickHouse/pull/57551) ([Bharat Nallan](https://github.com/bharatnc)).
+* Table system.dropped_tables_parts contains parts of system.dropped_tables tables (dropped but not yet removed tables). [#57555](https://github.com/ClickHouse/ClickHouse/pull/57555) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)).
+* Add `FORMAT_BYTES` as an alias for `formatReadableSize`. [#57592](https://github.com/ClickHouse/ClickHouse/pull/57592) ([Bharat Nallan](https://github.com/bharatnc)).
+* Add SHA512_256 function. [#57645](https://github.com/ClickHouse/ClickHouse/pull/57645) ([Bharat Nallan](https://github.com/bharatnc)).
+* Allow passing optional SESSION_TOKEN to `s3` table function. [#57850](https://github.com/ClickHouse/ClickHouse/pull/57850) ([Shani Elharrar](https://github.com/shanielh)).
+* Clause `ORDER BY` now supports specifying `ALL`, meaning that ClickHouse sorts by all columns in the `SELECT` clause. Example: `SELECT col1, col2 FROM tab WHERE [...] ORDER BY ALL`. [#57875](https://github.com/ClickHouse/ClickHouse/pull/57875) ([zhongyuankai](https://github.com/zhongyuankai)).
+* Added functions for punycode encoding/decoding: `punycodeEncode()` and `punycodeDecode()`. [#57969](https://github.com/ClickHouse/ClickHouse/pull/57969) ([Robert Schulze](https://github.com/rschu1ze)).
+* This PR implements `PASTE JOIN`, which allows users to join tables without an `ON` clause. Example: `SELECT * FROM (SELECT number AS a FROM numbers(2)) AS t1 PASTE JOIN (SELECT number AS a FROM numbers(2) ORDER BY a DESC) AS t2`. [#57995](https://github.com/ClickHouse/ClickHouse/pull/57995) ([Yarik Briukhovetskyi](https://github.com/yariks5s)).
+* A handler `/binary` opens a visual viewer of symbols inside the ClickHouse binary. [#58211](https://github.com/ClickHouse/ClickHouse/pull/58211) ([Alexey Milovidov](https://github.com/alexey-milovidov)).
+
+#### Performance Improvement
+* Copying between S3 disks now uses S3 server-side copy instead of copying through the buffer. Improves `BACKUP/RESTORE` operations and the `clickhouse-disks copy` command. [#56744](https://github.com/ClickHouse/ClickHouse/pull/56744) ([MikhailBurdukov](https://github.com/MikhailBurdukov)).
+* HashJoin respects the setting `max_joined_block_size_rows` and does not produce large blocks for `ALL JOIN`. [#56996](https://github.com/ClickHouse/ClickHouse/pull/56996) ([vdimir](https://github.com/vdimir)).
+* Release memory for aggregation earlier. This may avoid unnecessary external aggregation. [#57691](https://github.com/ClickHouse/ClickHouse/pull/57691) ([Nikolai Kochetov](https://github.com/KochetovNicolai)).
+* Improve performance of string serialization. [#57717](https://github.com/ClickHouse/ClickHouse/pull/57717) ([Maksim Kita](https://github.com/kitaisreal)).
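To make the `ORDER BY ALL` and `PASTE JOIN` entries above more concrete, here is a small sketch; the queries are illustrative only and run against the built-in `numbers()` table function:

```sql
-- ORDER BY ALL sorts by every column in the SELECT clause.
SELECT number % 3 AS grp, number AS n
FROM numbers(6)
ORDER BY ALL;          -- equivalent to ORDER BY grp, n

-- PASTE JOIN glues two result sets together row by row, without an ON clause.
SELECT *
FROM (SELECT number AS a FROM numbers(2)) AS t1
PASTE JOIN (SELECT number AS a FROM numbers(2) ORDER BY a DESC) AS t2;
```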
[#57717](https://github.com/ClickHouse/ClickHouse/pull/57717) ([Maksim Kita](https://github.com/kitaisreal)). +* Support trivial count optimization for `Merge`-engine tables. [#57867](https://github.com/ClickHouse/ClickHouse/pull/57867) ([skyoct](https://github.com/skyoct)). +* Optimized aggregation in some cases. [#57872](https://github.com/ClickHouse/ClickHouse/pull/57872) ([Anton Popov](https://github.com/CurtizJ)). +* The `hasAny()` function can now take advantage of the full-text skipping indices. [#57878](https://github.com/ClickHouse/ClickHouse/pull/57878) ([Jpnock](https://github.com/Jpnock)). +* Function `if(cond, then, else)` (and its alias `cond ? then : else`) was optimized to use branch-free evaluation. [#57885](https://github.com/ClickHouse/ClickHouse/pull/57885) ([zhanglistar](https://github.com/zhanglistar)). +* Extract non-intersecting parts ranges from MergeTree tables during FINAL processing. This allows the additional FINAL logic to be skipped for these non-intersecting parts ranges. When the amount of duplicate values with the same primary key is low, performance is almost the same as without FINAL. Also improves reading performance for MergeTree FINAL when the `do_not_merge_across_partitions_select_final` setting is set. [#58120](https://github.com/ClickHouse/ClickHouse/pull/58120) ([Maksim Kita](https://github.com/kitaisreal)). +* MergeTree now automatically derives the `do_not_merge_across_partitions_select_final` setting if the partition key expression contains only columns from the primary key expression. [#58218](https://github.com/ClickHouse/ClickHouse/pull/58218) ([Maksim Kita](https://github.com/kitaisreal)). +* Speed up MIN and MAX for native types. [#58231](https://github.com/ClickHouse/ClickHouse/pull/58231) ([Raúl Marín](https://github.com/Algunenano)). + +#### Improvement +* Make inserts into distributed tables handle updated cluster configuration properly. Previously, when the list of cluster nodes was dynamically updated, the directory monitor of the Distributed table could not detect new nodes without being recreated. [#42826](https://github.com/ClickHouse/ClickHouse/pull/42826) ([zhongyuankai](https://github.com/zhongyuankai)). +* Replace `--no-system-tables` with loading virtual tables of the system database lazily. [#55271](https://github.com/ClickHouse/ClickHouse/pull/55271) ([Azat Khuzhin](https://github.com/azat)). +* clickhouse-test now prints the case serial number, current time, and case name for each test case. [#55710](https://github.com/ClickHouse/ClickHouse/pull/55710) ([guoxiaolong](https://github.com/guoxiaolongzte)). +* Do not allow creating a replicated table with inconsistent merge parameters. [#56833](https://github.com/ClickHouse/ClickHouse/pull/56833) ([Duc Canh Le](https://github.com/canhld94)). +* Implement SLRU cache policy for filesystem cache. [#57076](https://github.com/ClickHouse/ClickHouse/pull/57076) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Show uncompressed size in `system.tables`, obtained from data parts' checksums [#56618](https://github.com/ClickHouse/ClickHouse/issues/56618). [#57186](https://github.com/ClickHouse/ClickHouse/pull/57186) ([Chen Lixiang](https://github.com/chenlx0)). +* Add `skip_unavailable_shards` as a setting for `Distributed` tables that is similar to the corresponding query-level setting. Closes [#43666](https://github.com/ClickHouse/ClickHouse/issues/43666). [#57218](https://github.com/ClickHouse/ClickHouse/pull/57218) ([Gagan Goel](https://github.com/tntnatbry)). 
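+
+As a minimal sketch of the table-level `skip_unavailable_shards` setting from the previous entry (the cluster, database and table names here are hypothetical):
+
+```sql
+-- With the setting enabled, SELECTs over this Distributed table silently skip
+-- shards that are currently unreachable instead of failing the whole query.
+CREATE TABLE hits_distributed AS hits_local
+ENGINE = Distributed('my_cluster', 'default', 'hits_local')
+SETTINGS skip_unavailable_shards = 1;
+```
+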
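+
+The `ALTER TABLE ... APPLY DELETED MASK` command from the New Feature section above can be illustrated with a short, hypothetical example (the table name and filter are made up):
+
+```sql
+-- A lightweight delete only writes a mask of deleted rows;
+-- APPLY DELETED MASK then physically removes the masked rows from disk.
+DELETE FROM events WHERE event_date < '2023-01-01';
+ALTER TABLE events APPLY DELETED MASK;
+```
+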
+* Function `substring()` (aliases: `substr`, `mid`) can now be used with `Enum` types. Previously, the first function argument had to be a value of type `String` or `FixedString`. This improves compatibility with third-party tools such as Tableau via the MySQL interface. [#57277](https://github.com/ClickHouse/ClickHouse/pull/57277) ([Serge Klochkov](https://github.com/slvrtrn)). +* Better hints when a table doesn't exist. [#57342](https://github.com/ClickHouse/ClickHouse/pull/57342) ([Bharat Nallan](https://github.com/bharatnc)). +* Allow to overwrite `max_partition_size_to_drop` and `max_table_size_to_drop` server settings at query time. [#57452](https://github.com/ClickHouse/ClickHouse/pull/57452) ([Jordi Villar](https://github.com/jrdi)). +* Add support for the read-only flag when connecting to the ZooKeeper server (fixes [#53749](https://github.com/ClickHouse/ClickHouse/issues/53749)). [#57479](https://github.com/ClickHouse/ClickHouse/pull/57479) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Fix possible distributed sends getting stuck due to "No such file or directory" (while recovering a batch from disk). Fix possible issues with `error_count` from `system.distribution_queue` (in case of `distributed_directory_monitor_max_sleep_time_ms` > 5 min). Introduce a profile event to track async INSERT failures: `DistributedAsyncInsertionFailures`. [#57480](https://github.com/ClickHouse/ClickHouse/pull/57480) ([Azat Khuzhin](https://github.com/azat)). +* The limit for the number of connections per endpoint for background fetches was raised from `15` to the value of the `background_fetches_pool_size` setting. The MergeTree-level setting `replicated_max_parallel_fetches_for_host` became obsolete. The MergeTree-level settings `replicated_fetches_http_connection_timeout`, `replicated_fetches_http_send_timeout` and `replicated_fetches_http_receive_timeout` were moved to the server level. The setting `keep_alive_timeout` was added to the list of server-level settings. [#57523](https://github.com/ClickHouse/ClickHouse/pull/57523) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* It is now possible to refer to an ALIAS column in index (non-primary-key) definitions (issue [#55650](https://github.com/ClickHouse/ClickHouse/issues/55650)). Example: `CREATE TABLE tab(col UInt32, col_alias ALIAS col + 1, INDEX idx (col_alias) TYPE minmax) ENGINE = MergeTree ORDER BY col;`. [#57546](https://github.com/ClickHouse/ClickHouse/pull/57546) ([Robert Schulze](https://github.com/rschu1ze)). +* Function `format()` now supports arbitrary argument types (instead of only `String` and `FixedString` arguments). This makes it possible to compute, for example, `SELECT format('The {0} to all questions is {1}', 'answer', 42)`. [#57549](https://github.com/ClickHouse/ClickHouse/pull/57549) ([Robert Schulze](https://github.com/rschu1ze)). +* Support PostgreSQL generated columns and default column values in `MaterializedPostgreSQL`. Closes [#40449](https://github.com/ClickHouse/ClickHouse/issues/40449). [#57568](https://github.com/ClickHouse/ClickHouse/pull/57568) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Allow to apply some filesystem cache config settings changes without a server restart. [#57578](https://github.com/ClickHouse/ClickHouse/pull/57578) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Handle the SIGABRT case when getting a PostgreSQL table structure with an empty array. [#57618](https://github.com/ClickHouse/ClickHouse/pull/57618) ([Mike Kot (Михаил Кот)](https://github.com/myrrc)). 
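+
+A small illustration of the `substring()`-on-`Enum` improvement described above (the Enum definition and values are arbitrary):
+
+```sql
+-- substring()/substr()/mid() now operate on the Enum's string name.
+SELECT substring(CAST('hello' AS Enum('hello' = 1, 'world' = 2)), 2, 3); -- 'ell'
+```
+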
+* The first argument of the `date_trunc()` function is now case-insensitive. Both variants are supported: `SELECT date_trunc('day', now())` and `SELECT date_trunc('DAY', now())`. [#57624](https://github.com/ClickHouse/ClickHouse/pull/57624) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* Expose the total number of errors that occurred since the last server start as a `ClickHouseErrorMetric_ALL` metric. [#57627](https://github.com/ClickHouse/ClickHouse/pull/57627) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Allow config nodes with `from_env`/`from_zk` attributes and a non-empty element when `replace=1` is used. [#57628](https://github.com/ClickHouse/ClickHouse/pull/57628) ([Azat Khuzhin](https://github.com/azat)). +* Generate malformed output that cannot be parsed as JSON. [#57646](https://github.com/ClickHouse/ClickHouse/pull/57646) ([Julia Kartseva](https://github.com/jkartseva)). +* Consider lightweight deleted rows when selecting parts to merge if enabled. [#57648](https://github.com/ClickHouse/ClickHouse/pull/57648) ([Zhuo Qiu](https://github.com/jewelzqiu)). +* Make querying `system.filesystem_cache` not memory-intensive. [#57687](https://github.com/ClickHouse/ClickHouse/pull/57687) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Allow IPv6 to UInt128 conversion and binary arithmetic. [#57707](https://github.com/ClickHouse/ClickHouse/pull/57707) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* Support negative positional arguments. Closes [#57736](https://github.com/ClickHouse/ClickHouse/issues/57736). [#57741](https://github.com/ClickHouse/ClickHouse/pull/57741) ([flynn](https://github.com/ucasfl)). +* Add a setting for the asynchronous inserts deduplication cache that controls how long to wait for a cache update. Deprecate the setting `async_block_ids_cache_min_update_interval_ms`. Now the cache is updated only in case of conflicts. [#57743](https://github.com/ClickHouse/ClickHouse/pull/57743) ([alesapin](https://github.com/alesapin)). +* The `sleep()` function can now be cancelled with `KILL QUERY`. [#57746](https://github.com/ClickHouse/ClickHouse/pull/57746) ([Vitaly Baranov](https://github.com/vitlibar)). +* Slightly better inference of unnamed tuples in JSON formats. [#57751](https://github.com/ClickHouse/ClickHouse/pull/57751) ([Kruglov Pavel](https://github.com/Avogar)). +* Refactor UserDefinedSQL* classes to make it possible to add SQL UDF storages which are different from ZooKeeper and Disk. [#57752](https://github.com/ClickHouse/ClickHouse/pull/57752) ([Natasha Chizhonkova](https://github.com/chizhonkova)). +* Forbid `CREATE TABLE ... AS SELECT` queries for Replicated table engines in a Replicated database because they are broken. Reference [#35408](https://github.com/ClickHouse/ClickHouse/issues/35408). [#57796](https://github.com/ClickHouse/ClickHouse/pull/57796) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix and improve the query transformation for external databases: all compatible predicates are now obtained recursively. [#57888](https://github.com/ClickHouse/ClickHouse/pull/57888) ([flynn](https://github.com/ucasfl)). +* Support dynamic reloading of filesystem cache size. Closes [#57866](https://github.com/ClickHouse/ClickHouse/issues/57866). [#57897](https://github.com/ClickHouse/ClickHouse/pull/57897) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix system.stack_trace for threads with blocked SIGRTMIN. [#57907](https://github.com/ClickHouse/ClickHouse/pull/57907) ([Azat Khuzhin](https://github.com/azat)). 
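+
+A quick, illustrative check of the case-insensitive `date_trunc()` first argument mentioned above:
+
+```sql
+-- Both spellings of the unit are now accepted and produce the same result.
+SELECT date_trunc('DAY', now()) = date_trunc('day', now()); -- 1
+```
+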
+* Added a new setting `readonly` which can be used to specify that an s3 disk is read-only. It can be useful for creating a table on a read-only `s3_plain` type disk. [#57977](https://github.com/ClickHouse/ClickHouse/pull/57977) ([Pengyuan Bian](https://github.com/bianpengyuan)). +* Support Keeper failures in the quorum check. [#57986](https://github.com/ClickHouse/ClickHouse/pull/57986) ([Raúl Marín](https://github.com/Algunenano)). +* Add max/peak RSS (`MemoryResidentMax`) into `system.asynchronous_metrics`. [#58095](https://github.com/ClickHouse/ClickHouse/pull/58095) ([Azat Khuzhin](https://github.com/azat)). +* Fix `system.stack_trace` for threads with blocked SIGRTMIN (and also send the signal to threads only if it is not blocked, to avoid waiting `storage_system_stack_trace_pipe_read_timeout_ms` when it does not make any sense). [#58136](https://github.com/ClickHouse/ClickHouse/pull/58136) ([Azat Khuzhin](https://github.com/azat)). +* Allow using s3 links (`https://` and `s3://`) without specifying the region if it is not the default one. Also detect the correct region if the user specified a wrong one. [#58148](https://github.com/ClickHouse/ClickHouse/pull/58148) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* `clickhouse-format --obfuscate` will know about Settings, MergeTreeSettings, and time zones and keep their names unchanged. [#58179](https://github.com/ClickHouse/ClickHouse/pull/58179) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Added an explicit `finalize()` function in `ZipArchiveWriter`. Simplify overly complicated code in `ZipArchiveWriter`. This fixes [#58074](https://github.com/ClickHouse/ClickHouse/issues/58074). [#58202](https://github.com/ClickHouse/ClickHouse/pull/58202) ([Vitaly Baranov](https://github.com/vitlibar)). +* The primary key analysis in MergeTree tables will now be applied to predicates that include the virtual column `_part_offset` (optionally with `_part`). This feature can serve as a poor man's secondary index. [#58224](https://github.com/ClickHouse/ClickHouse/pull/58224) ([Amos Bird](https://github.com/amosbird)). +* Make caches with the same path use the same cache objects. This behaviour existed before, but was broken in https://github.com/ClickHouse/ClickHouse/pull/48805 (in 23.4). If such caches with the same path have a different set of cache settings, an exception will be thrown stating that this is not allowed. [#58264](https://github.com/ClickHouse/ClickHouse/pull/58264) ([Kseniia Sumarokova](https://github.com/kssenii)). + +#### Build/Testing/Packaging Improvement +* Allow usage of Azure-related table engines/functions on macOS. [#51866](https://github.com/ClickHouse/ClickHouse/pull/51866) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* ClickHouse Fast Test now uses Musl instead of GLibc. [#57711](https://github.com/ClickHouse/ClickHouse/pull/57711) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Run ClickBench for every commit. This closes [#57708](https://github.com/ClickHouse/ClickHouse/issues/57708). [#57712](https://github.com/ClickHouse/ClickHouse/pull/57712) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### Bug Fix (user-visible misbehavior in an official stable release) + +* Fixed a sorting order breakage in TTL GROUP BY [#49103](https://github.com/ClickHouse/ClickHouse/pull/49103) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). 
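+
+A hypothetical sketch of the `_part_offset` primary-key-analysis entry in the Improvement section above (the part name and offsets are made up):
+
+```sql
+-- Predicates on _part_offset (optionally combined with _part) are now taken into
+-- account by the primary key analysis, acting as a poor man's secondary index.
+SELECT *
+FROM events
+WHERE _part = 'all_1_1_0' AND _part_offset BETWEEN 1000 AND 2000;
+```
+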
+* fix: split lttb bucket strategy, first bucket and last bucket should only contain single point [#57003](https://github.com/ClickHouse/ClickHouse/pull/57003) ([FFish](https://github.com/wxybear)). +* Fix possible deadlock in Template format during sync after error [#57004](https://github.com/ClickHouse/ClickHouse/pull/57004) ([Kruglov Pavel](https://github.com/Avogar)). +* Fix early stop while parsing file with skipping lots of errors [#57006](https://github.com/ClickHouse/ClickHouse/pull/57006) ([Kruglov Pavel](https://github.com/Avogar)). +* Prevent dictionary's ACL bypass via dictionary() table function [#57362](https://github.com/ClickHouse/ClickHouse/pull/57362) ([Salvatore Mesoraca](https://github.com/aiven-sal)). +* Fix another case of non-ready set. [#57423](https://github.com/ClickHouse/ClickHouse/pull/57423) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix several issues regarding PostgreSQL `array_ndims` usage. [#57436](https://github.com/ClickHouse/ClickHouse/pull/57436) ([Ryan Jacobs](https://github.com/ryanmjacobs)). +* Fix RWLock inconsistency after write lock timeout [#57454](https://github.com/ClickHouse/ClickHouse/pull/57454) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix: don't exclude ephemeral column when building pushing to view chain [#57461](https://github.com/ClickHouse/ClickHouse/pull/57461) ([Yakov Olkhovskiy](https://github.com/yakov-olkhovskiy)). +* MaterializedPostgreSQL: fix issue [#41922](https://github.com/ClickHouse/ClickHouse/issues/41922), add test for [#41923](https://github.com/ClickHouse/ClickHouse/issues/41923) [#57515](https://github.com/ClickHouse/ClickHouse/pull/57515) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Ignore ON CLUSTER clause in grant/revoke queries for management of replicated access entities. [#57538](https://github.com/ClickHouse/ClickHouse/pull/57538) ([MikhailBurdukov](https://github.com/MikhailBurdukov)). +* Fix crash in clickhouse-local [#57553](https://github.com/ClickHouse/ClickHouse/pull/57553) ([Nikolay Degterinsky](https://github.com/evillique)). +* Materialize block in HashJoin for Type::EMPTY [#57564](https://github.com/ClickHouse/ClickHouse/pull/57564) ([vdimir](https://github.com/vdimir)). +* Fix possible segfault in PostgreSQLSource [#57567](https://github.com/ClickHouse/ClickHouse/pull/57567) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix type correction in HashJoin for nested low cardinality [#57614](https://github.com/ClickHouse/ClickHouse/pull/57614) ([vdimir](https://github.com/vdimir)). +* Avoid hangs of system.stack_trace by correctly prohibit parallel read from it [#57641](https://github.com/ClickHouse/ClickHouse/pull/57641) ([Azat Khuzhin](https://github.com/azat)). +* Fix SIGSEGV for aggregation of sparse columns with any() RESPECT NULL [#57710](https://github.com/ClickHouse/ClickHouse/pull/57710) ([Azat Khuzhin](https://github.com/azat)). +* Fix unary operators parsing [#57713](https://github.com/ClickHouse/ClickHouse/pull/57713) ([Nikolay Degterinsky](https://github.com/evillique)). +* Fix RWLock inconsistency after write lock timeout (again) [#57733](https://github.com/ClickHouse/ClickHouse/pull/57733) ([Vitaly Baranov](https://github.com/vitlibar)). +* Table engine MaterializedPostgreSQL fix dependency loading [#57754](https://github.com/ClickHouse/ClickHouse/pull/57754) ([Kseniia Sumarokova](https://github.com/kssenii)). 
+* Fix retries for disconnected nodes for BACKUP/RESTORE ON CLUSTER [#57764](https://github.com/ClickHouse/ClickHouse/pull/57764) ([Vitaly Baranov](https://github.com/vitlibar)). +* Fix bug window functions: revert [#39631](https://github.com/ClickHouse/ClickHouse/issues/39631) [#57766](https://github.com/ClickHouse/ClickHouse/pull/57766) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix result of external aggregation in case of partially materialized projection [#57790](https://github.com/ClickHouse/ClickHouse/pull/57790) ([Anton Popov](https://github.com/CurtizJ)). +* Fix merge in aggregation functions with `*Map` combinator [#57795](https://github.com/ClickHouse/ClickHouse/pull/57795) ([Anton Popov](https://github.com/CurtizJ)). +* Disable system.kafka_consumers by default (due to possible live memory leak) [#57822](https://github.com/ClickHouse/ClickHouse/pull/57822) ([Azat Khuzhin](https://github.com/azat)). +* Fix low-cardinality keys support in MergeJoin [#57827](https://github.com/ClickHouse/ClickHouse/pull/57827) ([vdimir](https://github.com/vdimir)). +* Create consumers for Kafka tables on fly (but keep them for some period since last used) [#57829](https://github.com/ClickHouse/ClickHouse/pull/57829) ([Azat Khuzhin](https://github.com/azat)). +* InterpreterCreateQuery sample block fix [#57855](https://github.com/ClickHouse/ClickHouse/pull/57855) ([Maksim Kita](https://github.com/kitaisreal)). +* bugfix: addresses_expr ignored for psql named collections [#57874](https://github.com/ClickHouse/ClickHouse/pull/57874) ([joelynch](https://github.com/joelynch)). +* Fix invalid memory access in BLAKE3 (Rust) [#57876](https://github.com/ClickHouse/ClickHouse/pull/57876) ([Raúl Marín](https://github.com/Algunenano)). +* Resurrect `arrayFold()` [#57879](https://github.com/ClickHouse/ClickHouse/pull/57879) ([Robert Schulze](https://github.com/rschu1ze)). +* Normalize function names in CREATE INDEX [#57906](https://github.com/ClickHouse/ClickHouse/pull/57906) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix handling of unavailable replicas before first request happened [#57933](https://github.com/ClickHouse/ClickHouse/pull/57933) ([Nikita Taranov](https://github.com/nickitat)). +* Fix literal alias misclassification [#57988](https://github.com/ClickHouse/ClickHouse/pull/57988) ([Chen768959](https://github.com/Chen768959)). +* Revert "Fix bug window functions: revert [#39631](https://github.com/ClickHouse/ClickHouse/issues/39631)" [#58031](https://github.com/ClickHouse/ClickHouse/pull/58031) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Fix invalid preprocessing on Keeper [#58069](https://github.com/ClickHouse/ClickHouse/pull/58069) ([Antonio Andelic](https://github.com/antonio2368)). +* Fix Integer overflow in Poco::UTF32Encoding [#58073](https://github.com/ClickHouse/ClickHouse/pull/58073) ([Andrey Fedotov](https://github.com/anfedotoff)). +* Fix parallel replicas in presence of a scalar subquery with a big integer value [#58118](https://github.com/ClickHouse/ClickHouse/pull/58118) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix `accurateCastOrNull` for out-of-range DateTime [#58139](https://github.com/ClickHouse/ClickHouse/pull/58139) ([Andrey Zvonov](https://github.com/zvonand)). +* Fix possible PARAMETER_OUT_OF_BOUND error during subcolumns reading from wide part in MergeTree [#58175](https://github.com/ClickHouse/ClickHouse/pull/58175) ([Kruglov Pavel](https://github.com/Avogar)). 
+* Remove parallel parsing for JSONCompactEachRow [#58181](https://github.com/ClickHouse/ClickHouse/pull/58181) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* fix CREATE VIEW hang [#58220](https://github.com/ClickHouse/ClickHouse/pull/58220) ([Tao Wang](https://github.com/wangtZJU)). +* Fix parallel parsing for JSONCompactEachRow [#58250](https://github.com/ClickHouse/ClickHouse/pull/58250) ([Kruglov Pavel](https://github.com/Avogar)). + +#### NO CL ENTRY + +* NO CL ENTRY: 'Revert "Revert "Update Sentry""'. [#57694](https://github.com/ClickHouse/ClickHouse/pull/57694) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Fix RWLock inconsistency after write lock timeout"'. [#57730](https://github.com/ClickHouse/ClickHouse/pull/57730) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "improve CI with digest for docker, build and test jobs"'. [#57903](https://github.com/ClickHouse/ClickHouse/pull/57903) ([Max K.](https://github.com/mkaynov)). +* NO CL ENTRY: 'Reapply "improve CI with digest for docker, build and test jobs"'. [#57904](https://github.com/ClickHouse/ClickHouse/pull/57904) ([Max K.](https://github.com/mkaynov)). +* NO CL ENTRY: 'Revert "Merge pull request [#56573](https://github.com/ClickHouse/ClickHouse/issues/56573) from mkmkme/mkmkme/reload-config"'. [#57909](https://github.com/ClickHouse/ClickHouse/pull/57909) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Add system.dropped_tables_parts table"'. [#58022](https://github.com/ClickHouse/ClickHouse/pull/58022) ([Antonio Andelic](https://github.com/antonio2368)). +* NO CL ENTRY: 'Revert "Consider lightweight deleted rows when selecting parts to merge"'. [#58097](https://github.com/ClickHouse/ClickHouse/pull/58097) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Fix leftover processes/hangs in tests"'. [#58207](https://github.com/ClickHouse/ClickHouse/pull/58207) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Create consumers for Kafka tables on fly (but keep them for some period since last used)"'. [#58272](https://github.com/ClickHouse/ClickHouse/pull/58272) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* NO CL ENTRY: 'Revert "Implement punycode encoding/decoding"'. [#58277](https://github.com/ClickHouse/ClickHouse/pull/58277) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + +#### NOT FOR CHANGELOG / INSIGNIFICANT + +* Randomize more settings [#39663](https://github.com/ClickHouse/ClickHouse/pull/39663) ([Anton Popov](https://github.com/CurtizJ)). +* Add more tests for `compile_expressions` [#51113](https://github.com/ClickHouse/ClickHouse/pull/51113) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* [RFC] Correctly wait background threads [#52717](https://github.com/ClickHouse/ClickHouse/pull/52717) ([Azat Khuzhin](https://github.com/azat)). +* improve CI with digest for docker, build and test jobs [#56317](https://github.com/ClickHouse/ClickHouse/pull/56317) ([Max K.](https://github.com/mkaynov)). +* Prepare the introduction of more keeper faults [#56917](https://github.com/ClickHouse/ClickHouse/pull/56917) ([Raúl Marín](https://github.com/Algunenano)). +* Analyzer: Fix assert in tryReplaceAndEqualsChainsWithConstant [#57139](https://github.com/ClickHouse/ClickHouse/pull/57139) ([vdimir](https://github.com/vdimir)). 
+* Check what will happen if we build ClickHouse with Musl [#57180](https://github.com/ClickHouse/ClickHouse/pull/57180) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* support memory soft limit for keeper [#57271](https://github.com/ClickHouse/ClickHouse/pull/57271) ([Han Fei](https://github.com/hanfei1991)). +* Randomize disabled optimizations in CI [#57315](https://github.com/ClickHouse/ClickHouse/pull/57315) ([Raúl Marín](https://github.com/Algunenano)). +* Don't throw if noop when dropping database replica in batch [#57337](https://github.com/ClickHouse/ClickHouse/pull/57337) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Better JSON -> JSONEachRow fallback without catching exceptions [#57364](https://github.com/ClickHouse/ClickHouse/pull/57364) ([Kruglov Pavel](https://github.com/Avogar)). +* Add tests for [#48496](https://github.com/ClickHouse/ClickHouse/issues/48496) [#57414](https://github.com/ClickHouse/ClickHouse/pull/57414) ([Raúl Marín](https://github.com/Algunenano)). +* Add profile event for cache lookup in `ThreadPoolRemoteFSReader` [#57437](https://github.com/ClickHouse/ClickHouse/pull/57437) ([Nikita Taranov](https://github.com/nickitat)). +* Remove select() usage [#57467](https://github.com/ClickHouse/ClickHouse/pull/57467) ([Igor Nikonov](https://github.com/devcrafter)). +* Parallel replicas: friendly settings [#57542](https://github.com/ClickHouse/ClickHouse/pull/57542) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix formatting string prompt error [#57569](https://github.com/ClickHouse/ClickHouse/pull/57569) ([skyoct](https://github.com/skyoct)). +* Tune CI scale up/down multipliers [#57572](https://github.com/ClickHouse/ClickHouse/pull/57572) ([Max K.](https://github.com/mkaynov)). +* Revert "Revert "Implemented series period detect method using pocketfft lib"" [#57574](https://github.com/ClickHouse/ClickHouse/pull/57574) ([Bhavna Jindal](https://github.com/bhavnajindal)). +* Correctly handle errors during opening query in editor in client [#57587](https://github.com/ClickHouse/ClickHouse/pull/57587) ([Azat Khuzhin](https://github.com/azat)). +* Add a test for [#55251](https://github.com/ClickHouse/ClickHouse/issues/55251) [#57588](https://github.com/ClickHouse/ClickHouse/pull/57588) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Add a test for [#48039](https://github.com/ClickHouse/ClickHouse/issues/48039) [#57593](https://github.com/ClickHouse/ClickHouse/pull/57593) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update CHANGELOG.md [#57594](https://github.com/ClickHouse/ClickHouse/pull/57594) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Update version after release [#57595](https://github.com/ClickHouse/ClickHouse/pull/57595) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Update version_date.tsv and changelogs after v23.11.1.2711-stable [#57597](https://github.com/ClickHouse/ClickHouse/pull/57597) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Identify failed jobs in lambda and mark as steps=0 [#57600](https://github.com/ClickHouse/ClickHouse/pull/57600) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Fix flaky test: distinct in order with analyzer [#57606](https://github.com/ClickHouse/ClickHouse/pull/57606) ([Igor Nikonov](https://github.com/devcrafter)). +* CHJIT add assembly printer [#57610](https://github.com/ClickHouse/ClickHouse/pull/57610) ([Maksim Kita](https://github.com/kitaisreal)). 
+* Fix parsing virtual hosted S3 URI in clickhouse_backupview script [#57612](https://github.com/ClickHouse/ClickHouse/pull/57612) ([Daniel Pozo Escalona](https://github.com/danipozo)). +* Fix docs for `fileCluster` [#57613](https://github.com/ClickHouse/ClickHouse/pull/57613) ([Andrey Zvonov](https://github.com/zvonand)). +* Analyzer: Fix logical error in MultiIfToIfPass [#57622](https://github.com/ClickHouse/ClickHouse/pull/57622) ([vdimir](https://github.com/vdimir)). +* Throw more clear exception [#57626](https://github.com/ClickHouse/ClickHouse/pull/57626) ([alesapin](https://github.com/alesapin)). +* Fix "logs and exception messages formatting", part 1 [#57630](https://github.com/ClickHouse/ClickHouse/pull/57630) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix "logs and exception messages formatting", part 2 [#57632](https://github.com/ClickHouse/ClickHouse/pull/57632) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix "logs and exception messages formatting", part 3 [#57633](https://github.com/ClickHouse/ClickHouse/pull/57633) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix "logs and exception messages formatting", part 4 [#57634](https://github.com/ClickHouse/ClickHouse/pull/57634) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove bad test (1) [#57636](https://github.com/ClickHouse/ClickHouse/pull/57636) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove bad test (2) [#57637](https://github.com/ClickHouse/ClickHouse/pull/57637) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* ClickHouse Cloud promotion [#57638](https://github.com/ClickHouse/ClickHouse/pull/57638) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Remove bad test (3) [#57639](https://github.com/ClickHouse/ClickHouse/pull/57639) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Remove bad test (4) [#57640](https://github.com/ClickHouse/ClickHouse/pull/57640) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Random changes in random files [#57642](https://github.com/ClickHouse/ClickHouse/pull/57642) ([Nikita Mikhaylov](https://github.com/nikitamikhaylov)). +* Merge half of [#51113](https://github.com/ClickHouse/ClickHouse/issues/51113) [#57643](https://github.com/ClickHouse/ClickHouse/pull/57643) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Analyzer: Fix JOIN ON true with join_use_nulls [#57662](https://github.com/ClickHouse/ClickHouse/pull/57662) ([vdimir](https://github.com/vdimir)). +* Pin alpine version of integration tests helper container [#57669](https://github.com/ClickHouse/ClickHouse/pull/57669) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Add support for system.stack_trace filtering optimizations for analyzer [#57682](https://github.com/ClickHouse/ClickHouse/pull/57682) ([Azat Khuzhin](https://github.com/azat)). +* test for [#33308](https://github.com/ClickHouse/ClickHouse/issues/33308) [#57693](https://github.com/ClickHouse/ClickHouse/pull/57693) ([Denny Crane](https://github.com/den-crane)). +* support keeper memory soft limit ratio [#57699](https://github.com/ClickHouse/ClickHouse/pull/57699) ([Han Fei](https://github.com/hanfei1991)). +* Fix test_dictionaries_update_and_reload/test.py::test_reload_while_loading flakiness [#57714](https://github.com/ClickHouse/ClickHouse/pull/57714) ([Azat Khuzhin](https://github.com/azat)). 
+* Tune autoscale to scale for single job in the queue [#57742](https://github.com/ClickHouse/ClickHouse/pull/57742) ([Max K.](https://github.com/mkaynov)). +* Tune network memory for dockerhub proxy hosts [#57744](https://github.com/ClickHouse/ClickHouse/pull/57744) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Parallel replicas: announcement response handling improvement [#57749](https://github.com/ClickHouse/ClickHouse/pull/57749) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix building Rust with Musl [#57756](https://github.com/ClickHouse/ClickHouse/pull/57756) ([Azat Khuzhin](https://github.com/azat)). +* Fix flaky test_parallel_replicas_distributed_read_from_all [#57757](https://github.com/ClickHouse/ClickHouse/pull/57757) ([Igor Nikonov](https://github.com/devcrafter)). +* Minor refactoring of toStartOfInterval() [#57761](https://github.com/ClickHouse/ClickHouse/pull/57761) ([Robert Schulze](https://github.com/rschu1ze)). +* Don't run test 02919_skip_lots_of_parsing_errors on aarch64 [#57762](https://github.com/ClickHouse/ClickHouse/pull/57762) ([Kruglov Pavel](https://github.com/Avogar)). +* More respect to `min_number_of_marks` in `ParallelReplicasReadingCoordinator` [#57763](https://github.com/ClickHouse/ClickHouse/pull/57763) ([Nikita Taranov](https://github.com/nickitat)). +* SerializationString reduce memory usage [#57787](https://github.com/ClickHouse/ClickHouse/pull/57787) ([Maksim Kita](https://github.com/kitaisreal)). +* Fix ThreadSanitizer data race in librdkafka [#57791](https://github.com/ClickHouse/ClickHouse/pull/57791) ([Ilya Golshtein](https://github.com/ilejn)). +* Rename `system.async_loader` into `system.asynchronous_loader` [#57793](https://github.com/ClickHouse/ClickHouse/pull/57793) ([Sergei Trifonov](https://github.com/serxa)). +* Set replica number to its position in cluster definition [#57800](https://github.com/ClickHouse/ClickHouse/pull/57800) ([Nikita Taranov](https://github.com/nickitat)). +* fix clickhouse-client invocation in 02327_capnproto_protobuf_empty_messages [#57804](https://github.com/ClickHouse/ClickHouse/pull/57804) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Fix flaky test_parallel_replicas_over_distributed [#57809](https://github.com/ClickHouse/ClickHouse/pull/57809) ([Igor Nikonov](https://github.com/devcrafter)). +* Revert [#57741](https://github.com/ClickHouse/ClickHouse/issues/57741) [#57811](https://github.com/ClickHouse/ClickHouse/pull/57811) ([Raúl Marín](https://github.com/Algunenano)). +* Dumb down `substring()` tests [#57821](https://github.com/ClickHouse/ClickHouse/pull/57821) ([Robert Schulze](https://github.com/rschu1ze)). +* Update version_date.tsv and changelogs after v23.11.2.11-stable [#57824](https://github.com/ClickHouse/ClickHouse/pull/57824) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Fix 02906_force_optimize_projection_name [#57826](https://github.com/ClickHouse/ClickHouse/pull/57826) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* ClickBench: slightly better [#57831](https://github.com/ClickHouse/ClickHouse/pull/57831) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix 02932_kill_query_sleep flakiness [#57849](https://github.com/ClickHouse/ClickHouse/pull/57849) ([Azat Khuzhin](https://github.com/azat)). +* Revert "Replace --no-system-tables with loading virtual tables of system database lazily" [#57851](https://github.com/ClickHouse/ClickHouse/pull/57851) ([Azat Khuzhin](https://github.com/azat)). 
+* Fix memory leak in StorageHDFS [#57860](https://github.com/ClickHouse/ClickHouse/pull/57860) ([Andrey Zvonov](https://github.com/zvonand)). +* Remove hardcoded clickhouse-client invocations from tests [#57861](https://github.com/ClickHouse/ClickHouse/pull/57861) ([Mikhail Koviazin](https://github.com/mkmkme)). +* Follow up to [#57568](https://github.com/ClickHouse/ClickHouse/issues/57568) [#57863](https://github.com/ClickHouse/ClickHouse/pull/57863) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Fix assertion in HashJoin [#57873](https://github.com/ClickHouse/ClickHouse/pull/57873) ([vdimir](https://github.com/vdimir)). +* More efficient constructor for SerializationEnum [#57887](https://github.com/ClickHouse/ClickHouse/pull/57887) ([Duc Canh Le](https://github.com/canhld94)). +* Fix test_unset_skip_unavailable_shards [#57895](https://github.com/ClickHouse/ClickHouse/pull/57895) ([Raúl Marín](https://github.com/Algunenano)). +* Add argument to fill the gap in cherry-pick [#57896](https://github.com/ClickHouse/ClickHouse/pull/57896) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Delete debug logging in OutputFormatWithUTF8ValidationAdaptor [#57899](https://github.com/ClickHouse/ClickHouse/pull/57899) ([Kruglov Pavel](https://github.com/Avogar)). +* Remove heavy rust stable toolchain [#57905](https://github.com/ClickHouse/ClickHouse/pull/57905) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Improvements for 00002_log_and_exception_messages_formatting [#57910](https://github.com/ClickHouse/ClickHouse/pull/57910) ([Raúl Marín](https://github.com/Algunenano)). +* Update CHANGELOG.md [#57911](https://github.com/ClickHouse/ClickHouse/pull/57911) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* remove cruft from TablesLoader [#57938](https://github.com/ClickHouse/ClickHouse/pull/57938) ([Bharat Nallan](https://github.com/bharatnc)). +* Fix `/dashboard` work with passwords [#57948](https://github.com/ClickHouse/ClickHouse/pull/57948) ([Sergei Trifonov](https://github.com/serxa)). +* Remove wrong test [#57950](https://github.com/ClickHouse/ClickHouse/pull/57950) ([Sergei Trifonov](https://github.com/serxa)). +* Fix docker image for integration tests (fixes CI) [#57952](https://github.com/ClickHouse/ClickHouse/pull/57952) ([Azat Khuzhin](https://github.com/azat)). +* Remove C++ templates (normalizeQuery) [#57963](https://github.com/ClickHouse/ClickHouse/pull/57963) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* A small fix for dashboard [#57964](https://github.com/ClickHouse/ClickHouse/pull/57964) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Always use `pread` for reading cache segments [#57970](https://github.com/ClickHouse/ClickHouse/pull/57970) ([Nikita Taranov](https://github.com/nickitat)). +* Improve some tests [#57973](https://github.com/ClickHouse/ClickHouse/pull/57973) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Revert "Merge pull request [#57907](https://github.com/ClickHouse/ClickHouse/issues/57907) from azat/system.stack_trace-rt_tgsigqueueinfo" [#57974](https://github.com/ClickHouse/ClickHouse/pull/57974) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add a test for [#49708](https://github.com/ClickHouse/ClickHouse/issues/49708) [#57979](https://github.com/ClickHouse/ClickHouse/pull/57979) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix style-check checkout head-ref [#57989](https://github.com/ClickHouse/ClickHouse/pull/57989) ([Mikhail f. 
Shiryaev](https://github.com/Felixoid)). +* refine error message [#57991](https://github.com/ClickHouse/ClickHouse/pull/57991) ([Han Fei](https://github.com/hanfei1991)). +* CI for docs only fix [#57992](https://github.com/ClickHouse/ClickHouse/pull/57992) ([Max K.](https://github.com/mkaynov)). +* Replace rust's BLAKE3 with llvm's implementation [#57994](https://github.com/ClickHouse/ClickHouse/pull/57994) ([Raúl Marín](https://github.com/Algunenano)). +* Better trivial count optimization for storage `Merge` [#57996](https://github.com/ClickHouse/ClickHouse/pull/57996) ([Anton Popov](https://github.com/CurtizJ)). +* enhanced docs for `date_trunc()` [#58000](https://github.com/ClickHouse/ClickHouse/pull/58000) ([Yarik Briukhovetskyi](https://github.com/yariks5s)). +* CI: add needs_changed_files flag for pr_info [#58003](https://github.com/ClickHouse/ClickHouse/pull/58003) ([Max K.](https://github.com/mkaynov)). +* more messages in ci [#58007](https://github.com/ClickHouse/ClickHouse/pull/58007) ([Sema Checherinda](https://github.com/CheSema)). +* Test parallel replicas with force_primary_key setting [#58010](https://github.com/ClickHouse/ClickHouse/pull/58010) ([Igor Nikonov](https://github.com/devcrafter)). +* Update 00002_log_and_exception_messages_formatting.sql [#58012](https://github.com/ClickHouse/ClickHouse/pull/58012) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix rare race in external sort/aggregation with temporary data in cache [#58013](https://github.com/ClickHouse/ClickHouse/pull/58013) ([Anton Popov](https://github.com/CurtizJ)). +* Fix segfault in FuzzJSON engine [#58015](https://github.com/ClickHouse/ClickHouse/pull/58015) ([Julia Kartseva](https://github.com/jkartseva)). +* fix freebsd build [#58019](https://github.com/ClickHouse/ClickHouse/pull/58019) ([Julia Kartseva](https://github.com/jkartseva)). +* Rename canUseParallelReplicas to canUseTaskBasedParallelReplicas [#58025](https://github.com/ClickHouse/ClickHouse/pull/58025) ([Raúl Marín](https://github.com/Algunenano)). +* Remove fixed tests from analyzer_tech_debt.txt [#58028](https://github.com/ClickHouse/ClickHouse/pull/58028) ([Raúl Marín](https://github.com/Algunenano)). +* More verbose errors on 00002_log_and_exception_messages_formatting [#58037](https://github.com/ClickHouse/ClickHouse/pull/58037) ([Raúl Marín](https://github.com/Algunenano)). +* Make window insert result into constant [#58045](https://github.com/ClickHouse/ClickHouse/pull/58045) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* CI: Happy new year [#58046](https://github.com/ClickHouse/ClickHouse/pull/58046) ([Raúl Marín](https://github.com/Algunenano)). +* Follow up for [#57691](https://github.com/ClickHouse/ClickHouse/issues/57691) [#58048](https://github.com/ClickHouse/ClickHouse/pull/58048) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* always run ast_fuzz and sqllancer [#58049](https://github.com/ClickHouse/ClickHouse/pull/58049) ([Max K.](https://github.com/mkaynov)). +* Add GH status for PR formating [#58050](https://github.com/ClickHouse/ClickHouse/pull/58050) ([Max K.](https://github.com/mkaynov)). +* Small improvement for SystemLogBase [#58051](https://github.com/ClickHouse/ClickHouse/pull/58051) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Bump Azure to v1.6.0 [#58052](https://github.com/ClickHouse/ClickHouse/pull/58052) ([Robert Schulze](https://github.com/rschu1ze)). 
+* Correct values for randomization [#58058](https://github.com/ClickHouse/ClickHouse/pull/58058) ([Anton Popov](https://github.com/CurtizJ)). +* Non post request should be readonly [#58060](https://github.com/ClickHouse/ClickHouse/pull/58060) ([San](https://github.com/santrancisco)). +* Revert "Merge pull request [#55710](https://github.com/ClickHouse/ClickHouse/issues/55710) from guoxiaolongzte/clickhouse-test… [#58066](https://github.com/ClickHouse/ClickHouse/pull/58066) ([Raúl Marín](https://github.com/Algunenano)). +* fix typo in the test 02479 [#58072](https://github.com/ClickHouse/ClickHouse/pull/58072) ([Sema Checherinda](https://github.com/CheSema)). +* Bump Azure to 1.7.2 [#58075](https://github.com/ClickHouse/ClickHouse/pull/58075) ([Robert Schulze](https://github.com/rschu1ze)). +* Fix flaky test `02567_and_consistency` [#58076](https://github.com/ClickHouse/ClickHouse/pull/58076) ([Anton Popov](https://github.com/CurtizJ)). +* Fix Tests Bugfix Validate Check [#58078](https://github.com/ClickHouse/ClickHouse/pull/58078) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Fix for nightly job for digest-ci [#58079](https://github.com/ClickHouse/ClickHouse/pull/58079) ([Max K.](https://github.com/mkaynov)). +* Test for parallel replicas with remote() [#58081](https://github.com/ClickHouse/ClickHouse/pull/58081) ([Igor Nikonov](https://github.com/devcrafter)). +* Minor cosmetic changes [#58092](https://github.com/ClickHouse/ClickHouse/pull/58092) ([Raúl Marín](https://github.com/Algunenano)). +* Reintroduce OPTIMIZE CLEANUP as no-op [#58100](https://github.com/ClickHouse/ClickHouse/pull/58100) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add compatibility in the replication protocol for a removed feature [#58104](https://github.com/ClickHouse/ClickHouse/pull/58104) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Flaky 02922_analyzer_aggregate_nothing_type [#58105](https://github.com/ClickHouse/ClickHouse/pull/58105) ([Raúl Marín](https://github.com/Algunenano)). +* Update version_date.tsv and changelogs after v23.11.3.23-stable [#58106](https://github.com/ClickHouse/ClickHouse/pull/58106) ([robot-clickhouse](https://github.com/robot-clickhouse)). +* Limited CI on the master for docs only change [#58121](https://github.com/ClickHouse/ClickHouse/pull/58121) ([Max K.](https://github.com/mkaynov)). +* style fix [#58125](https://github.com/ClickHouse/ClickHouse/pull/58125) ([Max K.](https://github.com/mkaynov)). +* Support "do not test" label with ci.py [#58128](https://github.com/ClickHouse/ClickHouse/pull/58128) ([Max K.](https://github.com/mkaynov)). +* Use the single images list for integration tests everywhere [#58130](https://github.com/ClickHouse/ClickHouse/pull/58130) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Disable parallel replicas with IN (subquery) [#58133](https://github.com/ClickHouse/ClickHouse/pull/58133) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix clang-tidy [#58134](https://github.com/ClickHouse/ClickHouse/pull/58134) ([Raúl Marín](https://github.com/Algunenano)). +* Run build report check job on build failures, fix [#58135](https://github.com/ClickHouse/ClickHouse/pull/58135) ([Max K.](https://github.com/mkaynov)). +* Fix dashboard legend sorting and rows number [#58151](https://github.com/ClickHouse/ClickHouse/pull/58151) ([Sergei Trifonov](https://github.com/serxa)). 
+* Remove retryStrategy assignments overwritten in ClientFactory::create() [#58163](https://github.com/ClickHouse/ClickHouse/pull/58163) ([Daniel Pozo Escalona](https://github.com/danipozo)). +* Helper improvements [#58164](https://github.com/ClickHouse/ClickHouse/pull/58164) ([Mikhail f. Shiryaev](https://github.com/Felixoid)). +* Pass through exceptions for reading from S3 [#58165](https://github.com/ClickHouse/ClickHouse/pull/58165) ([Azat Khuzhin](https://github.com/azat)). +* [RFC] Adjust all std::ios implementations in poco to set failbit/badbit by default [#58166](https://github.com/ClickHouse/ClickHouse/pull/58166) ([Azat Khuzhin](https://github.com/azat)). +* Add bytes_uncompressed to system.part_log [#58167](https://github.com/ClickHouse/ClickHouse/pull/58167) ([Jordi Villar](https://github.com/jrdi)). +* Update docker/test/stateful/run.sh [#58168](https://github.com/ClickHouse/ClickHouse/pull/58168) ([Kseniia Sumarokova](https://github.com/kssenii)). +* Update 00165_jit_aggregate_functions.sql [#58169](https://github.com/ClickHouse/ClickHouse/pull/58169) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Update clickhouse-test [#58170](https://github.com/ClickHouse/ClickHouse/pull/58170) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Profile event 'ParallelReplicasUsedCount' [#58173](https://github.com/ClickHouse/ClickHouse/pull/58173) ([Igor Nikonov](https://github.com/devcrafter)). +* Fix flaky test `02719_aggregate_with_empty_string_key` [#58176](https://github.com/ClickHouse/ClickHouse/pull/58176) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix [#58171](https://github.com/ClickHouse/ClickHouse/issues/58171) [#58177](https://github.com/ClickHouse/ClickHouse/pull/58177) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Add base backup name to system.backups and system.backup_log tables [#58178](https://github.com/ClickHouse/ClickHouse/pull/58178) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Fix use-after-move [#58182](https://github.com/ClickHouse/ClickHouse/pull/58182) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Looking at strange code [#58196](https://github.com/ClickHouse/ClickHouse/pull/58196) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix all Exception with missing arguments [#58198](https://github.com/ClickHouse/ClickHouse/pull/58198) ([Azat Khuzhin](https://github.com/azat)). +* Fix leftover processes/hangs in tests [#58200](https://github.com/ClickHouse/ClickHouse/pull/58200) ([Azat Khuzhin](https://github.com/azat)). +* Fix DWARFBlockInputFormat failing on DWARF 5 unit address ranges [#58204](https://github.com/ClickHouse/ClickHouse/pull/58204) ([Michael Kolupaev](https://github.com/al13n321)). +* Fix error in archive reader [#58206](https://github.com/ClickHouse/ClickHouse/pull/58206) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Fix DWARFBlockInputFormat using wrong base address sometimes [#58208](https://github.com/ClickHouse/ClickHouse/pull/58208) ([Michael Kolupaev](https://github.com/al13n321)). +* Add support for specifying query parameters in the command line in clickhouse-local [#58210](https://github.com/ClickHouse/ClickHouse/pull/58210) ([Pradeep Chhetri](https://github.com/chhetripradeep)). +* Fix leftover processes/hangs in tests (resubmit) [#58213](https://github.com/ClickHouse/ClickHouse/pull/58213) ([Azat Khuzhin](https://github.com/azat)). 
+* Add optimization for AND notEquals chain in logical expression optimizer [#58214](https://github.com/ClickHouse/ClickHouse/pull/58214) ([Kevin Mingtarja](https://github.com/kevinmingtarja)). +* Fix syntax and doc [#58221](https://github.com/ClickHouse/ClickHouse/pull/58221) ([San](https://github.com/santrancisco)). +* Cleanup some known short messages [#58226](https://github.com/ClickHouse/ClickHouse/pull/58226) ([Raúl Marín](https://github.com/Algunenano)). +* Some code refactoring (was an attempt to improve build time, but failed) [#58237](https://github.com/ClickHouse/ClickHouse/pull/58237) ([Azat Khuzhin](https://github.com/azat)). +* Fix perf test README [#58245](https://github.com/ClickHouse/ClickHouse/pull/58245) ([Raúl Marín](https://github.com/Algunenano)). +* [Analyzer] Add test for [#57086](https://github.com/ClickHouse/ClickHouse/issues/57086) [#58249](https://github.com/ClickHouse/ClickHouse/pull/58249) ([Raúl Marín](https://github.com/Algunenano)). +* Reintroduce compatibility with `is_deleted` on a syntax level [#58251](https://github.com/ClickHouse/ClickHouse/pull/58251) ([Alexey Milovidov](https://github.com/alexey-milovidov)). +* Avoid throwing ABORTED on normal situations [#58252](https://github.com/ClickHouse/ClickHouse/pull/58252) ([Raúl Marín](https://github.com/Algunenano)). +* Remove mayBenefitFromIndexForIn [#58265](https://github.com/ClickHouse/ClickHouse/pull/58265) ([Nikolai Kochetov](https://github.com/KochetovNicolai)). +* Allow a few retries when committing a part during shutdown [#58269](https://github.com/ClickHouse/ClickHouse/pull/58269) ([Alexander Tokmakov](https://github.com/tavplubix)). +* Revert [#58267](https://github.com/ClickHouse/ClickHouse/issues/58267) [#58274](https://github.com/ClickHouse/ClickHouse/pull/58274) ([Alexey Milovidov](https://github.com/alexey-milovidov)). + diff --git a/docs/en/development/build-cross-osx.md b/docs/en/development/build-cross-osx.md index a04d676e92d..eddf24448c1 100644 --- a/docs/en/development/build-cross-osx.md +++ b/docs/en/development/build-cross-osx.md @@ -28,18 +28,20 @@ sudo apt-get install clang-17 Let’s remember the path where we install `cctools` as ${CCTOOLS} ``` bash +mkdir ~/cctools export CCTOOLS=$(cd ~/cctools && pwd) -mkdir ${CCTOOLS} cd ${CCTOOLS} -git clone --depth=1 https://github.com/tpoechtrager/apple-libtapi.git +git clone https://github.com/tpoechtrager/apple-libtapi.git cd apple-libtapi +git checkout 15dfc2a8c9a2a89d06ff227560a69f5265b692f9 INSTALLPREFIX=${CCTOOLS} ./build.sh ./install.sh cd .. -git clone --depth=1 https://github.com/tpoechtrager/cctools-port.git +git clone https://github.com/tpoechtrager/cctools-port.git cd cctools-port/cctools +git checkout 2a3e1c2a6ff54a30f898b70cfb9ba1692a55fad7 ./configure --prefix=$(readlink -f ${CCTOOLS}) --with-libtapi=$(readlink -f ${CCTOOLS}) --target=x86_64-apple-darwin make install ``` diff --git a/docs/en/development/build-cross-s390x.md b/docs/en/development/build-cross-s390x.md index 088dd6f2679..b7cda515d77 100644 --- a/docs/en/development/build-cross-s390x.md +++ b/docs/en/development/build-cross-s390x.md @@ -1,206 +1,206 @@ ---- -slug: /en/development/build-cross-s390x -sidebar_position: 69 -title: How to Build, Run and Debug ClickHouse on Linux for s390x (zLinux) -sidebar_label: Build on Linux for s390x (zLinux) ---- - -As of writing (2023/3/10) building for s390x considered to be experimental. Not all features can be enabled, has broken features and is currently under active development. 
- - -## Building - -As s390x does not support boringssl, it uses OpenSSL and has two related build options. -- By default, the s390x build will dynamically link to OpenSSL libraries. It will build OpenSSL shared objects, so it's not necessary to install OpenSSL beforehand. (This option is recommended in all cases.) -- Another option is to build OpenSSL in-tree. In this case two build flags need to be supplied to cmake -```bash --DENABLE_OPENSSL_DYNAMIC=0 -DENABLE_OPENSSL=1 -``` - -These instructions assume that the host machine is x86_64 and has all the tooling required to build natively based on the [build instructions](../development/build.md). It also assumes that the host is Ubuntu 22.04 but the following instructions should also work on Ubuntu 20.04. - -In addition to installing the tooling used to build natively, the following additional packages need to be installed: - -```bash -apt-get install binutils-s390x-linux-gnu libc6-dev-s390x-cross gcc-s390x-linux-gnu binfmt-support qemu-user-static -``` - -If you wish to cross compile rust code install the rust cross compile target for s390x: -```bash -rustup target add s390x-unknown-linux-gnu -``` - -To build for s390x: -```bash -cmake -DCMAKE_TOOLCHAIN_FILE=cmake/linux/toolchain-s390x.cmake .. -ninja -``` - -## Running - -Once built, the binary can be run with, eg.: - -```bash -qemu-s390x-static -L /usr/s390x-linux-gnu ./clickhouse -``` - -## Debugging - -Install LLDB: - -```bash -apt-get install lldb-15 -``` - -To Debug a s390x executable, run clickhouse using QEMU in debug mode: - -```bash -qemu-s390x-static -g 31338 -L /usr/s390x-linux-gnu ./clickhouse -``` - -In another shell run LLDB and attach, replace `` and `` with the values corresponding to your environment. -```bash -lldb-15 -(lldb) target create ./clickhouse -Current executable set to '//ClickHouse//programs/clickhouse' (s390x). -(lldb) settings set target.source-map //ClickHouse -(lldb) gdb-remote 31338 -Process 1 stopped -* thread #1, stop reason = signal SIGTRAP - frame #0: 0x0000004020e74cd0 --> 0x4020e74cd0: lgr %r2, %r15 - 0x4020e74cd4: aghi %r15, -160 - 0x4020e74cd8: xc 0(8,%r15), 0(%r15) - 0x4020e74cde: brasl %r14, 275429939040 -(lldb) b main -Breakpoint 1: 9 locations. -(lldb) c -Process 1 resuming -Process 1 stopped -* thread #1, stop reason = breakpoint 1.1 - frame #0: 0x0000004005cd9fc0 clickhouse`main(argc_=1, argv_=0x0000004020e594a8) at main.cpp:450:17 - 447 #if !defined(FUZZING_MODE) - 448 int main(int argc_, char ** argv_) - 449 { --> 450 inside_main = true; - 451 SCOPE_EXIT({ inside_main = false; }); - 452 - 453 /// PHDR cache is required for query profiler to work reliably -``` - -## Visual Studio Code integration - -- [CodeLLDB](https://github.com/vadimcn/vscode-lldb) extension is required for visual debugging. -- [Command Variable](https://github.com/rioj7/command-variable) extension can help dynamic launches if using [CMake Variants](https://github.com/microsoft/vscode-cmake-tools/blob/main/docs/variants.md). -- Make sure to set the backend to your LLVM installation eg. `"lldb.library": "/usr/lib/x86_64-linux-gnu/liblldb-15.so"` -- Make sure to run the clickhouse executable in debug mode prior to launch. 
(It is also possible to create a `preLaunchTask` that automates this) - -### Example configurations -#### cmake-variants.yaml -```yaml -buildType: - default: relwithdebinfo - choices: - debug: - short: Debug - long: Emit debug information - buildType: Debug - release: - short: Release - long: Optimize generated code - buildType: Release - relwithdebinfo: - short: RelWithDebInfo - long: Release with Debug Info - buildType: RelWithDebInfo - tsan: - short: MinSizeRel - long: Minimum Size Release - buildType: MinSizeRel - -toolchain: - default: default - description: Select toolchain - choices: - default: - short: x86_64 - long: x86_64 - s390x: - short: s390x - long: s390x - settings: - CMAKE_TOOLCHAIN_FILE: cmake/linux/toolchain-s390x.cmake -``` - -#### launch.json -```json -{ - "version": "0.2.0", - "configurations": [ - { - "type": "lldb", - "request": "custom", - "name": "(lldb) Launch s390x with qemu", - "targetCreateCommands": ["target create ${command:cmake.launchTargetPath}"], - "processCreateCommands": ["gdb-remote 2159"], - "preLaunchTask": "Run ClickHouse" - } - ] -} -``` - -#### settings.json -This would also put different builds under different subfolders of the `build` folder. -```json -{ - "cmake.buildDirectory": "${workspaceFolder}/build/${buildKitVendor}-${buildKitVersion}-${variant:toolchain}-${variant:buildType}", - "lldb.library": "/usr/lib/x86_64-linux-gnu/liblldb-15.so" -} -``` - -#### run-debug.sh -```sh -#! /bin/sh -echo 'Starting debugger session' -cd $1 -qemu-s390x-static -g 2159 -L /usr/s390x-linux-gnu $2 $3 $4 -``` - -#### tasks.json -Defines a task to run the compiled executable in `server` mode under a `tmp` folder next to the binaries, with configuration from under `programs/server/config.xml`. -```json -{ - "version": "2.0.0", - "tasks": [ - { - "label": "Run ClickHouse", - "type": "shell", - "isBackground": true, - "command": "${workspaceFolder}/.vscode/run-debug.sh", - "args": [ - "${command:cmake.launchTargetDirectory}/tmp", - "${command:cmake.launchTargetPath}", - "server", - "--config-file=${workspaceFolder}/programs/server/config.xml" - ], - "problemMatcher": [ - { - "pattern": [ - { - "regexp": ".", - "file": 1, - "location": 2, - "message": 3 - } - ], - "background": { - "activeOnStart": true, - "beginsPattern": "^Starting debugger session", - "endsPattern": ".*" - } - } - ] - } - ] -} -``` +--- +slug: /en/development/build-cross-s390x +sidebar_position: 69 +title: How to Build, Run and Debug ClickHouse on Linux for s390x (zLinux) +sidebar_label: Build on Linux for s390x (zLinux) +--- + +As of writing (2023/3/10) building for s390x considered to be experimental. Not all features can be enabled, has broken features and is currently under active development. + + +## Building + +As s390x does not support boringssl, it uses OpenSSL and has two related build options. +- By default, the s390x build will dynamically link to OpenSSL libraries. It will build OpenSSL shared objects, so it's not necessary to install OpenSSL beforehand. (This option is recommended in all cases.) +- Another option is to build OpenSSL in-tree. In this case two build flags need to be supplied to cmake +```bash +-DENABLE_OPENSSL_DYNAMIC=0 -DENABLE_OPENSSL=1 +``` + +These instructions assume that the host machine is x86_64 and has all the tooling required to build natively based on the [build instructions](../development/build.md). It also assumes that the host is Ubuntu 22.04 but the following instructions should also work on Ubuntu 20.04. 
+ +In addition to installing the tooling used to build natively, the following additional packages need to be installed: + +```bash +apt-get install binutils-s390x-linux-gnu libc6-dev-s390x-cross gcc-s390x-linux-gnu binfmt-support qemu-user-static +``` + +If you wish to cross compile rust code install the rust cross compile target for s390x: +```bash +rustup target add s390x-unknown-linux-gnu +``` + +To build for s390x: +```bash +cmake -DCMAKE_TOOLCHAIN_FILE=cmake/linux/toolchain-s390x.cmake .. +ninja +``` + +## Running + +Once built, the binary can be run with, eg.: + +```bash +qemu-s390x-static -L /usr/s390x-linux-gnu ./clickhouse +``` + +## Debugging + +Install LLDB: + +```bash +apt-get install lldb-15 +``` + +To Debug a s390x executable, run clickhouse using QEMU in debug mode: + +```bash +qemu-s390x-static -g 31338 -L /usr/s390x-linux-gnu ./clickhouse +``` + +In another shell run LLDB and attach, replace `` and `` with the values corresponding to your environment. +```bash +lldb-15 +(lldb) target create ./clickhouse +Current executable set to '//ClickHouse//programs/clickhouse' (s390x). +(lldb) settings set target.source-map //ClickHouse +(lldb) gdb-remote 31338 +Process 1 stopped +* thread #1, stop reason = signal SIGTRAP + frame #0: 0x0000004020e74cd0 +-> 0x4020e74cd0: lgr %r2, %r15 + 0x4020e74cd4: aghi %r15, -160 + 0x4020e74cd8: xc 0(8,%r15), 0(%r15) + 0x4020e74cde: brasl %r14, 275429939040 +(lldb) b main +Breakpoint 1: 9 locations. +(lldb) c +Process 1 resuming +Process 1 stopped +* thread #1, stop reason = breakpoint 1.1 + frame #0: 0x0000004005cd9fc0 clickhouse`main(argc_=1, argv_=0x0000004020e594a8) at main.cpp:450:17 + 447 #if !defined(FUZZING_MODE) + 448 int main(int argc_, char ** argv_) + 449 { +-> 450 inside_main = true; + 451 SCOPE_EXIT({ inside_main = false; }); + 452 + 453 /// PHDR cache is required for query profiler to work reliably +``` + +## Visual Studio Code integration + +- [CodeLLDB](https://github.com/vadimcn/vscode-lldb) extension is required for visual debugging. +- [Command Variable](https://github.com/rioj7/command-variable) extension can help dynamic launches if using [CMake Variants](https://github.com/microsoft/vscode-cmake-tools/blob/main/docs/variants.md). +- Make sure to set the backend to your LLVM installation eg. `"lldb.library": "/usr/lib/x86_64-linux-gnu/liblldb-15.so"` +- Make sure to run the clickhouse executable in debug mode prior to launch. 
(It is also possible to create a `preLaunchTask` that automates this) + +### Example configurations +#### cmake-variants.yaml +```yaml +buildType: + default: relwithdebinfo + choices: + debug: + short: Debug + long: Emit debug information + buildType: Debug + release: + short: Release + long: Optimize generated code + buildType: Release + relwithdebinfo: + short: RelWithDebInfo + long: Release with Debug Info + buildType: RelWithDebInfo + tsan: + short: MinSizeRel + long: Minimum Size Release + buildType: MinSizeRel + +toolchain: + default: default + description: Select toolchain + choices: + default: + short: x86_64 + long: x86_64 + s390x: + short: s390x + long: s390x + settings: + CMAKE_TOOLCHAIN_FILE: cmake/linux/toolchain-s390x.cmake +``` + +#### launch.json +```json +{ + "version": "0.2.0", + "configurations": [ + { + "type": "lldb", + "request": "custom", + "name": "(lldb) Launch s390x with qemu", + "targetCreateCommands": ["target create ${command:cmake.launchTargetPath}"], + "processCreateCommands": ["gdb-remote 2159"], + "preLaunchTask": "Run ClickHouse" + } + ] +} +``` + +#### settings.json +This would also put different builds under different subfolders of the `build` folder. +```json +{ + "cmake.buildDirectory": "${workspaceFolder}/build/${buildKitVendor}-${buildKitVersion}-${variant:toolchain}-${variant:buildType}", + "lldb.library": "/usr/lib/x86_64-linux-gnu/liblldb-15.so" +} +``` + +#### run-debug.sh +```sh +#! /bin/sh +echo 'Starting debugger session' +cd $1 +qemu-s390x-static -g 2159 -L /usr/s390x-linux-gnu $2 $3 $4 +``` + +#### tasks.json +Defines a task to run the compiled executable in `server` mode under a `tmp` folder next to the binaries, with configuration from under `programs/server/config.xml`. +```json +{ + "version": "2.0.0", + "tasks": [ + { + "label": "Run ClickHouse", + "type": "shell", + "isBackground": true, + "command": "${workspaceFolder}/.vscode/run-debug.sh", + "args": [ + "${command:cmake.launchTargetDirectory}/tmp", + "${command:cmake.launchTargetPath}", + "server", + "--config-file=${workspaceFolder}/programs/server/config.xml" + ], + "problemMatcher": [ + { + "pattern": [ + { + "regexp": ".", + "file": 1, + "location": 2, + "message": 3 + } + ], + "background": { + "activeOnStart": true, + "beginsPattern": "^Starting debugger session", + "endsPattern": ".*" + } + } + ] + } + ] +} +``` diff --git a/docs/en/development/build-osx.md b/docs/en/development/build-osx.md index e65de4a37e0..39ccc9a78c3 100644 --- a/docs/en/development/build-osx.md +++ b/docs/en/development/build-osx.md @@ -3,7 +3,7 @@ slug: /en/development/build-osx sidebar_position: 65 sidebar_label: Build on macOS title: How to Build ClickHouse on macOS -description: How to build ClickHouse on macOS +description: How to build ClickHouse on macOS for macOS --- :::info You don't have to build ClickHouse yourself! diff --git a/docs/en/development/developer-instruction.md b/docs/en/development/developer-instruction.md index 9d6a80de904..31346c77949 100644 --- a/docs/en/development/developer-instruction.md +++ b/docs/en/development/developer-instruction.md @@ -7,42 +7,39 @@ description: Prerequisites and an overview of how to build ClickHouse # Getting Started Guide for Building ClickHouse -The building of ClickHouse is supported on Linux, FreeBSD and macOS. +ClickHouse can be build on Linux, FreeBSD and macOS. If you use Windows, you can still build ClickHouse in a virtual machine running Linux, e.g. [VirtualBox](https://www.virtualbox.org/) with Ubuntu. 
-If you use Windows, you need to create a virtual machine with Ubuntu. To start working with a virtual machine please install VirtualBox. You can download Ubuntu from the website: https://www.ubuntu.com/#download. Please create a virtual machine from the downloaded image (you should reserve at least 4GB of RAM for it). To run a command-line terminal in Ubuntu, please locate a program containing the word “terminal” in its name (gnome-terminal, konsole etc.) or just press Ctrl+Alt+T. - -ClickHouse cannot work or build on a 32-bit system. You should acquire access to a 64-bit system and you can continue reading. +ClickHouse requires a 64-bit system to compile and run, 32-bit systems do not work. ## Creating a Repository on GitHub {#creating-a-repository-on-github} -To start working with ClickHouse repository you will need a GitHub account. +To start developing for ClickHouse you will need a [GitHub](https://www.virtualbox.org/) account. Please also generate a SSH key locally (if you don't have one already) and upload the public key to GitHub as this is a prerequisite for contributing patches. -You probably already have one, but if you do not, please register at https://github.com. In case you do not have SSH keys, you should generate them and then upload them on GitHub. It is required for sending over your patches. It is also possible to use the same SSH keys that you use with any other SSH servers - probably you already have those. +Next, create a fork of the [ClickHouse repository](https://github.com/ClickHouse/ClickHouse/) in your personal account by clicking the "fork" button in the upper right corner. -Create a fork of ClickHouse repository. To do that please click on the “fork” button in the upper right corner at https://github.com/ClickHouse/ClickHouse. It will fork your own copy of ClickHouse/ClickHouse to your account. +To contribute, e.g. a fix for an issue or a feature, please commit your changes to a branch in your fork, then create a "pull request" with the changes to the main repository. -The development process consists of first committing the intended changes into your fork of ClickHouse and then creating a “pull request” for these changes to be accepted into the main repository (ClickHouse/ClickHouse). +For working with Git repositories, please install `git`. In Ubuntu run these commands in a terminal: -To work with Git repositories, please install `git`. To do that in Ubuntu you would run in the command line terminal: +```sh +sudo apt update +sudo apt install git +``` - sudo apt update - sudo apt install git - -A brief manual on using Git can be found [here](https://education.github.com/git-cheat-sheet-education.pdf). -For a detailed manual on Git see [here](https://git-scm.com/book/en/v2). +A cheatsheet for using Git can be found [here](https://education.github.com/git-cheat-sheet-education.pdf). The detailed manual for Git is [here](https://git-scm.com/book/en/v2). ## Cloning a Repository to Your Development Machine {#cloning-a-repository-to-your-development-machine} -Next, you need to download the source files onto your working machine. This is called “to clone a repository” because it creates a local copy of the repository on your working machine. +First, download the source files to your working machine, i.e. 
clone the repository: -Run in your terminal: +```sh +git clone git@github.com:your_github_username/ClickHouse.git # replace placeholder with your GitHub user name +cd ClickHouse +``` - git clone git@github.com:your_github_username/ClickHouse.git # replace placeholder with your GitHub user name - cd ClickHouse +This command creates a directory `ClickHouse/` containing the source code of ClickHouse. If you specify a custom checkout directory after the URL but it is important that this path does not contain whitespaces as it may lead to problems with the build later on. -This command will create a directory `ClickHouse/` containing the source code of ClickHouse. If you specify a custom checkout directory (after the URL), it is important that this path does not contain whitespaces as it may lead to problems with the build system. - -To make library dependencies available for the build, the ClickHouse repository uses Git submodules, i.e. references to external repositories. These are not checked out by default. To do so, you can either +The ClickHouse repository uses Git submodules, i.e. references to external repositories (usually 3rd party libraries used by ClickHouse). These are not checked out by default. To do so, you can either - run `git clone` with option `--recurse-submodules`, @@ -52,7 +49,7 @@ To make library dependencies available for the build, the ClickHouse repository You can check the Git status with the command: `git submodule status`. -If you get the following error message: +If you get the following error message Permission denied (publickey). fatal: Could not read from remote repository. @@ -60,7 +57,7 @@ If you get the following error message: Please make sure you have the correct access rights and the repository exists. -It generally means that the SSH keys for connecting to GitHub are missing. These keys are normally located in `~/.ssh`. For SSH keys to be accepted you need to upload them in the settings section of GitHub UI. +it generally means that the SSH keys for connecting to GitHub are missing. These keys are normally located in `~/.ssh`. For SSH keys to be accepted you need to upload them in GitHub's settings. You can also clone the repository via https protocol: @@ -74,12 +71,17 @@ You can also add original ClickHouse repo address to your local repository to pu After successfully running this command you will be able to pull updates from the main ClickHouse repo by running `git pull upstream master`. +:::note +Instructions below assume you are building on Linux. If you are cross-compiling or building on macOS, please also check for operating system and architecture specific guides, such as building [on macOS for macOS](build-osx.md), [on Linux for macOS](build-cross-osx.md), [on Linux for Linux/RISC-V](build-cross-riscv.md) and so on. +::: + ## Build System {#build-system} ClickHouse uses CMake and Ninja for building. -CMake - a meta-build system that can generate Ninja files (build tasks). -Ninja - a smaller build system with a focus on the speed used to execute those cmake generated tasks. +- CMake - a meta-build system that can generate Ninja files (build tasks). + +- Ninja - a smaller build system with a focus on the speed used to execute those cmake generated tasks. To install on Ubuntu, Debian or Mint run `sudo apt install cmake ninja-build`. 
diff --git a/docs/en/development/style.md b/docs/en/development/style.md index 0b71a669638..77a550f2a0e 100644 --- a/docs/en/development/style.md +++ b/docs/en/development/style.md @@ -489,7 +489,7 @@ When using functions with response codes or `errno`, always check the result and ``` cpp if (0 != close(fd)) - throwFromErrno("Cannot close file " + file_name, ErrorCodes::CANNOT_CLOSE_FILE); + throw ErrnoException(ErrorCodes::CANNOT_CLOSE_FILE, "Cannot close file {}", file_name); ``` You can use assert to check invariant in code. diff --git a/docs/en/engines/table-engines/index.md b/docs/en/engines/table-engines/index.md index b024820024a..5e81eacc937 100644 --- a/docs/en/engines/table-engines/index.md +++ b/docs/en/engines/table-engines/index.md @@ -67,7 +67,6 @@ Engines in the family: Engines in the family: - [Distributed](../../engines/table-engines/special/distributed.md#distributed) -- [MaterializedView](../../engines/table-engines/special/materializedview.md#materializedview) - [Dictionary](../../engines/table-engines/special/dictionary.md#dictionary) - [Merge](../../engines/table-engines/special/merge.md#merge) - [File](../../engines/table-engines/special/file.md#file) diff --git a/docs/en/engines/table-engines/integrations/embedded-rocksdb.md b/docs/en/engines/table-engines/integrations/embedded-rocksdb.md index 9af857b0835..44febe78c77 100644 --- a/docs/en/engines/table-engines/integrations/embedded-rocksdb.md +++ b/docs/en/engines/table-engines/integrations/embedded-rocksdb.md @@ -212,5 +212,5 @@ ORDER BY key ASC ``` ### More information on Joins -- [`join_algorithm` setting](/docs/en/operations/settings/settings.md#settings-join_algorithm) +- [`join_algorithm` setting](/docs/en/operations/settings/settings.md#join_algorithm) - [JOIN clause](/docs/en/sql-reference/statements/select/join.md) diff --git a/docs/en/engines/table-engines/integrations/hdfs.md b/docs/en/engines/table-engines/integrations/hdfs.md index 19221c256f9..96e6bab6997 100644 --- a/docs/en/engines/table-engines/integrations/hdfs.md +++ b/docs/en/engines/table-engines/integrations/hdfs.md @@ -236,7 +236,7 @@ libhdfs3 support HDFS namenode HA. ## Storage Settings {#storage-settings} -- [hdfs_truncate_on_insert](/docs/en/operations/settings/settings.md#hdfs-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. +- [hdfs_truncate_on_insert](/docs/en/operations/settings/settings.md#hdfs_truncate_on_insert) - allows to truncate file before insert into it. Disabled by default. - [hdfs_create_multiple_files](/docs/en/operations/settings/settings.md#hdfs_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [hdfs_skip_empty_files](/docs/en/operations/settings/settings.md#hdfs_skip_empty_files) - allows to skip empty files while reading. Disabled by default. diff --git a/docs/en/engines/table-engines/integrations/kafka.md b/docs/en/engines/table-engines/integrations/kafka.md index de1a090d491..141d87fed20 100644 --- a/docs/en/engines/table-engines/integrations/kafka.md +++ b/docs/en/engines/table-engines/integrations/kafka.md @@ -54,7 +54,7 @@ Optional parameters: - `kafka_schema` — Parameter that must be used if the format requires a schema definition. For example, [Cap’n Proto](https://capnproto.org/) requires the path to the schema file and the name of the root `schema.capnp:Message` object. - `kafka_num_consumers` — The number of consumers per table. Specify more consumers if the throughput of one consumer is insufficient. 
The total number of consumers should not exceed the number of partitions in the topic, since only one consumer can be assigned per partition, and must not be greater than the number of physical cores on the server where ClickHouse is deployed. Default: `1`. -- `kafka_max_block_size` — The maximum batch size (in messages) for poll. Default: [max_insert_block_size](../../../operations/settings/settings.md#setting-max_insert_block_size). +- `kafka_max_block_size` — The maximum batch size (in messages) for poll. Default: [max_insert_block_size](../../../operations/settings/settings.md#max_insert_block_size). - `kafka_skip_broken_messages` — Kafka message parser tolerance to schema-incompatible messages per block. If `kafka_skip_broken_messages = N` then the engine skips *N* Kafka messages that cannot be parsed (a message equals a row of data). Default: `0`. - `kafka_commit_every_batch` — Commit every consumed and handled batch instead of a single commit after writing a whole block. Default: `0`. - `kafka_client_id` — Client identifier. Empty by default. @@ -151,7 +151,7 @@ Example: SELECT level, sum(total) FROM daily GROUP BY level; ``` -To improve performance, received messages are grouped into blocks the size of [max_insert_block_size](../../../operations/settings/settings.md#settings-max_insert_block_size). If the block wasn’t formed within [stream_flush_interval_ms](../../../operations/settings/settings.md/#stream-flush-interval-ms) milliseconds, the data will be flushed to the table regardless of the completeness of the block. +To improve performance, received messages are grouped into blocks the size of [max_insert_block_size](../../../operations/settings/settings.md#max_insert_block_size). If the block wasn’t formed within [stream_flush_interval_ms](../../../operations/settings/settings.md/#stream-flush-interval-ms) milliseconds, the data will be flushed to the table regardless of the completeness of the block. To stop receiving topic data or to change the conversion logic, detach the materialized view: diff --git a/docs/en/engines/table-engines/integrations/nats.md b/docs/en/engines/table-engines/integrations/nats.md index 37a41159fab..e898d1f1b82 100644 --- a/docs/en/engines/table-engines/integrations/nats.md +++ b/docs/en/engines/table-engines/integrations/nats.md @@ -58,7 +58,7 @@ Optional parameters: - `nats_reconnect_wait` – Amount of time in milliseconds to sleep between each reconnect attempt. Default: `5000`. - `nats_server_list` - Server list for connection. Can be specified to connect to NATS cluster. - `nats_skip_broken_messages` - NATS message parser tolerance to schema-incompatible messages per block. Default: `0`. If `nats_skip_broken_messages = N` then the engine skips *N* RabbitMQ messages that cannot be parsed (a message equals a row of data). -- `nats_max_block_size` - Number of row collected by poll(s) for flushing data from NATS. Default: [max_insert_block_size](../../../operations/settings/settings.md#setting-max_insert_block_size). +- `nats_max_block_size` - Number of row collected by poll(s) for flushing data from NATS. Default: [max_insert_block_size](../../../operations/settings/settings.md#max_insert_block_size). - `nats_flush_interval_ms` - Timeout for flushing data read from NATS. Default: [stream_flush_interval_ms](../../../operations/settings/settings.md#stream-flush-interval-ms). - `nats_username` - NATS username. - `nats_password` - NATS password. 
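For orientation, here is a minimal sketch of how the streaming parameters above are typically wired together. It assumes a NATS server at `localhost:4222` and a subject named `events`; those names, the table names, and the chosen batch values are placeholders rather than values taken from this page.

```sql
-- Hypothetical example: consume JSONEachRow messages from a NATS subject.
CREATE TABLE nats_queue
(
    level String,
    total UInt64
)
ENGINE = NATS
SETTINGS nats_url = 'localhost:4222',
         nats_subjects = 'events',
         nats_format = 'JSONEachRow',
         nats_max_block_size = 65536,    -- rows collected per poll before flushing
         nats_flush_interval_ms = 7500;  -- flush timeout for data read from NATS

-- As with Kafka, data is usually routed into a normal table via a materialized view.
CREATE TABLE daily (level String, total UInt64) ENGINE = MergeTree ORDER BY level;

CREATE MATERIALIZED VIEW consumer TO daily
AS SELECT level, total FROM nats_queue;
```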
diff --git a/docs/en/engines/table-engines/integrations/rabbitmq.md b/docs/en/engines/table-engines/integrations/rabbitmq.md index 53c6e089a70..0f3fef3d6fb 100644 --- a/docs/en/engines/table-engines/integrations/rabbitmq.md +++ b/docs/en/engines/table-engines/integrations/rabbitmq.md @@ -65,7 +65,7 @@ Optional parameters: - `rabbitmq_deadletter_exchange` - Specify name for a [dead letter exchange](https://www.rabbitmq.com/dlx.html). You can create another table with this exchange name and collect messages in cases when they are republished to dead letter exchange. By default dead letter exchange is not specified. - `rabbitmq_persistent` - If set to 1 (true), in insert query delivery mode will be set to 2 (marks messages as 'persistent'). Default: `0`. - `rabbitmq_skip_broken_messages` – RabbitMQ message parser tolerance to schema-incompatible messages per block. If `rabbitmq_skip_broken_messages = N` then the engine skips *N* RabbitMQ messages that cannot be parsed (a message equals a row of data). Default: `0`. -- `rabbitmq_max_block_size` - Number of row collected before flushing data from RabbitMQ. Default: [max_insert_block_size](../../../operations/settings/settings.md#setting-max_insert_block_size). +- `rabbitmq_max_block_size` - Number of row collected before flushing data from RabbitMQ. Default: [max_insert_block_size](../../../operations/settings/settings.md#max_insert_block_size). - `rabbitmq_flush_interval_ms` - Timeout for flushing data from RabbitMQ. Default: [stream_flush_interval_ms](../../../operations/settings/settings.md#stream-flush-interval-ms). - `rabbitmq_queue_settings_list` - allows to set RabbitMQ settings when creating a queue. Available settings: `x-max-length`, `x-max-length-bytes`, `x-message-ttl`, `x-expires`, `x-priority`, `x-max-priority`, `x-overflow`, `x-dead-letter-exchange`, `x-queue-type`. The `durable` setting is enabled automatically for the queue. - `rabbitmq_address` - Address for connection. Use ether this setting or `rabbitmq_host_port`. diff --git a/docs/en/engines/table-engines/integrations/s3.md b/docs/en/engines/table-engines/integrations/s3.md index 3144bdd32fa..dfa06801d04 100644 --- a/docs/en/engines/table-engines/integrations/s3.md +++ b/docs/en/engines/table-engines/integrations/s3.md @@ -222,7 +222,7 @@ CREATE TABLE table_with_asterisk (name String, value UInt32) ## Storage Settings {#storage-settings} -- [s3_truncate_on_insert](/docs/en/operations/settings/settings.md#s3-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. +- [s3_truncate_on_insert](/docs/en/operations/settings/settings.md#s3_truncate_on_insert) - allows to truncate file before insert into it. Disabled by default. - [s3_create_multiple_files](/docs/en/operations/settings/settings.md#s3_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [s3_skip_empty_files](/docs/en/operations/settings/settings.md#s3_skip_empty_files) - allows to skip empty files while reading. Disabled by default. 
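As a quick illustration of the storage settings listed above, the sketch below creates an S3-backed table and then overwrites its object on a repeated insert via `s3_truncate_on_insert`. The bucket URL is a placeholder and credentials are omitted, so this is not a runnable endpoint as written.

```sql
-- Hypothetical bucket path; substitute a real URL and, if needed, credentials.
CREATE TABLE s3_engine_table (name String, value UInt32)
    ENGINE = S3('https://my-bucket.s3.amazonaws.com/data/file.csv', 'CSV');

-- Without this setting, inserting into an object that already exists fails;
-- with it, the existing file is truncated first.
SET s3_truncate_on_insert = 1;
INSERT INTO s3_engine_table VALUES ('one', 1), ('two', 2);

SELECT * FROM s3_engine_table;
```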
diff --git a/docs/en/engines/table-engines/integrations/s3queue.md b/docs/en/engines/table-engines/integrations/s3queue.md index 2a9b25e0c1a..8b7f86cce5c 100644 --- a/docs/en/engines/table-engines/integrations/s3queue.md +++ b/docs/en/engines/table-engines/integrations/s3queue.md @@ -4,16 +4,9 @@ sidebar_position: 181 sidebar_label: S3Queue --- -# [experimental] S3Queue Table Engine +# S3Queue Table Engine This engine provides integration with [Amazon S3](https://aws.amazon.com/s3/) ecosystem and allows streaming import. This engine is similar to the [Kafka](../../../engines/table-engines/integrations/kafka.md), [RabbitMQ](../../../engines/table-engines/integrations/rabbitmq.md) engines, but provides S3-specific features. -:::note -This table engine is experimental. To use it, set `allow_experimental_s3queue` to 1 by using the `SET` command: -```sql -SET allow_experimental_s3queue=1 -``` -::: - ## Create Table {#creating-a-table} ``` sql diff --git a/docs/en/engines/table-engines/mergetree-family/custom-partitioning-key.md b/docs/en/engines/table-engines/mergetree-family/custom-partitioning-key.md index 97d37e476ae..23d98d4b20e 100644 --- a/docs/en/engines/table-engines/mergetree-family/custom-partitioning-key.md +++ b/docs/en/engines/table-engines/mergetree-family/custom-partitioning-key.md @@ -12,7 +12,7 @@ In most cases you do not need a partition key, and in most other cases you do no You should never use too granular of partitioning. Don't partition your data by client identifiers or names. Instead, make a client identifier or name the first column in the ORDER BY expression. ::: -Partitioning is available for the [MergeTree](../../../engines/table-engines/mergetree-family/mergetree.md) family tables (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) tables). [Materialized views](../../../engines/table-engines/special/materializedview.md#materializedview) based on MergeTree tables support partitioning, as well. +Partitioning is available for the [MergeTree family tables](../../../engines/table-engines/mergetree-family/mergetree.md), including [replicated tables](../../../engines/table-engines/mergetree-family/replication.md) and [materialized views](../../../sql-reference/statements/create/view.md#materialized-view). A partition is a logical combination of records in a table by a specified criterion. You can set a partition by an arbitrary criterion, such as by month, by day, or by event type. Each partition is stored separately to simplify manipulations of this data. When accessing the data, ClickHouse uses the smallest subset of partitions possible. Partitions improve performance for queries containing a partitioning key because ClickHouse will filter for that partition before selecting the parts and granules within the partition. diff --git a/docs/en/engines/table-engines/mergetree-family/mergetree.md b/docs/en/engines/table-engines/mergetree-family/mergetree.md index 89b002da192..ed413959ca6 100644 --- a/docs/en/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/en/engines/table-engines/mergetree-family/mergetree.md @@ -520,7 +520,7 @@ Indexes of type `set` can be utilized by all functions. 
The other index types ar | [empty](/docs/en/sql-reference/functions/array-functions#function-empty) | ✔ | ✔ | ✗ | ✗ | ✗ | ✗ | | [notEmpty](/docs/en/sql-reference/functions/array-functions#function-notempty) | ✔ | ✔ | ✗ | ✗ | ✗ | ✗ | | [has](/docs/en/sql-reference/functions/array-functions#function-has) | ✗ | ✗ | ✔ | ✔ | ✔ | ✔ | -| [hasAny](/docs/en/sql-reference/functions/array-functions#function-hasAny) | ✗ | ✗ | ✗ | ✗ | ✔ | ✗ | +| [hasAny](/docs/en/sql-reference/functions/array-functions#function-hasAny) | ✗ | ✗ | ✔ | ✔ | ✔ | ✗ | | [hasAll](/docs/en/sql-reference/functions/array-functions#function-hasAll) | ✗ | ✗ | ✗ | ✗ | ✔ | ✗ | | hasToken | ✗ | ✗ | ✗ | ✔ | ✗ | ✔ | | hasTokenOrNull | ✗ | ✗ | ✗ | ✔ | ✗ | ✔ | @@ -865,10 +865,10 @@ Tags: - `disk` — a disk within a volume. - `max_data_part_size_bytes` — the maximum size of a part that can be stored on any of the volume’s disks. If the a size of a merged part estimated to be bigger than `max_data_part_size_bytes` then this part will be written to a next volume. Basically this feature allows to keep new/small parts on a hot (SSD) volume and move them to a cold (HDD) volume when they reach large size. Do not use this setting if your policy has only one volume. - `move_factor` — when the amount of available space gets lower than this factor, data automatically starts to move on the next volume if any (by default, 0.1). ClickHouse sorts existing parts by size from largest to smallest (in descending order) and selects parts with the total size that is sufficient to meet the `move_factor` condition. If the total size of all parts is insufficient, all parts will be moved. -- `prefer_not_to_merge` — Disables merging of data parts on this volume. When this setting is enabled, merging data on this volume is not allowed. This allows controlling how ClickHouse works with slow disks. - `perform_ttl_move_on_insert` — Disables TTL move on data part INSERT. By default (if enabled) if we insert a data part that already expired by the TTL move rule it immediately goes to a volume/disk declared in move rule. This can significantly slowdown insert in case if destination volume/disk is slow (e.g. S3). If disabled then already expired data part is written into a default volume and then right after moved to TTL volume. - `load_balancing` - Policy for disk balancing, `round_robin` or `least_used`. - `least_used_ttl_ms` - Configure timeout (in milliseconds) for the updating available space on all disks (`0` - update always, `-1` - never update, default is `60000`). Note, if the disk can be used by ClickHouse only and is not subject to a online filesystem resize/shrink you can use `-1`, in all other cases it is not recommended, since eventually it will lead to incorrect space distribution. +- `prefer_not_to_merge` — You should not use this setting. Disables merging of data parts on this volume (this is harmful and leads to performance degradation). When this setting is enabled (don't do it), merging data on this volume is not allowed (which is bad). This allows (but you don't need it) controlling (if you want to control something, you're making a mistake) how ClickHouse works with slow disks (but ClickHouse knows better, so please don't use this setting). 
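To tie these tags back to tables: after a policy built from such volumes has been declared in the server configuration (see the configuration examples that follow), it is referenced from a table through the `storage_policy` MergeTree setting, and parts can additionally be relocated by hand. The policy and volume names below are hypothetical.

```sql
-- Assumes a policy named 'hot_to_cold' containing a volume named 'external'
-- has been declared in the storage configuration; both names are illustrative.
CREATE TABLE events
(
    event_date Date,
    event String
)
ENGINE = MergeTree
PARTITION BY toYYYYMM(event_date)
ORDER BY event_date
SETTINGS storage_policy = 'hot_to_cold';

-- Manually move one partition to the slower volume, independent of move_factor.
ALTER TABLE events MOVE PARTITION 202311 TO VOLUME 'external';
```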
Configuration examples: @@ -905,7 +905,6 @@ Configuration examples: external - true diff --git a/docs/en/engines/table-engines/special/distributed.md b/docs/en/engines/table-engines/special/distributed.md index 14431c4c43b..de8ae0357dc 100644 --- a/docs/en/engines/table-engines/special/distributed.md +++ b/docs/en/engines/table-engines/special/distributed.md @@ -1,13 +1,16 @@ --- -slug: /en/engines/table-engines/special/distributed +sidebar_label: "Distributed" sidebar_position: 10 -sidebar_label: Distributed +slug: /en/engines/table-engines/special/distributed --- # Distributed Table Engine -Tables with Distributed engine do not store any data of their own, but allow distributed query processing on multiple servers. -Reading is automatically parallelized. During a read, the table indexes on remote servers are used, if there are any. +:::warning +To create a distributed table engine in the cloud, you can use the [remote and remoteSecure](../../../sql-reference/table-functions/remote) table functions. The `Distributed(...)` syntax cannot be used in ClickHouse Cloud. +::: + +Tables with Distributed engine do not store any data of their own, but allow distributed query processing on multiple servers. Reading is automatically parallelized. During a read, the table indexes on remote servers are used, if there are any. ## Creating a Table {#distributed-creating-a-table} @@ -22,6 +25,7 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] ``` ### From a Table {#distributed-from-a-table} + When the `Distributed` table is pointing to a table on the current server you can adopt that table's schema: ``` sql @@ -48,7 +52,7 @@ CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] AS [db2.]name2 Specifying the `sharding_key` is necessary for the following: -- For `INSERTs` into a distributed table (as the table engine needs the `sharding_key` to determine how to split the data). However, if `insert_distributed_one_random_shard` setting is enabled, then `INSERTs` do not need the sharding key +- For `INSERTs` into a distributed table (as the table engine needs the `sharding_key` to determine how to split the data). However, if `insert_distributed_one_random_shard` setting is enabled, then `INSERTs` do not need the sharding key. - For use with `optimize_skip_unused_shards` as the `sharding_key` is necessary to determine what shards should be queried #### policy_name @@ -108,7 +112,7 @@ Specifying the `sharding_key` is necessary for the following: For **Insert limit settings** (`..._insert`) see also: - [distributed_foreground_insert](../../../operations/settings/settings.md#distributed_foreground_insert) setting -- [prefer_localhost_replica](../../../operations/settings/settings.md#settings-prefer-localhost-replica) setting +- [prefer_localhost_replica](../../../operations/settings/settings.md#prefer-localhost-replica) setting - `bytes_to_throw_insert` handled before `bytes_to_delay_insert`, so you should not set it to the value less then `bytes_to_delay_insert` ::: @@ -122,9 +126,7 @@ SETTINGS fsync_directories=0; ``` -Data will be read from all servers in the `logs` cluster, from the `default.hits` table located on every server in the cluster. -Data is not only read but is partially processed on the remote servers (to the extent that this is possible). -For example, for a query with `GROUP BY`, data will be aggregated on remote servers, and the intermediate states of aggregate functions will be sent to the requestor server. Then data will be further aggregated. 
+Data will be read from all servers in the `logs` cluster, from the `default.hits` table located on every server in the cluster. Data is not only read but is partially processed on the remote servers (to the extent that this is possible). For example, for a query with `GROUP BY`, data will be aggregated on remote servers, and the intermediate states of aggregate functions will be sent to the requestor server. Then data will be further aggregated. Instead of the database name, you can use a constant expression that returns a string. For example: `currentDatabase()`. @@ -183,9 +185,7 @@ Clusters are configured in the [server configuration file](../../../operations/c ``` -Here a cluster is defined with the name `logs` that consists of two shards, each of which contains two replicas. -Shards refer to the servers that contain different parts of the data (in order to read all the data, you must access all the shards). -Replicas are duplicating servers (in order to read all the data, you can access the data on any one of the replicas). +Here a cluster is defined with the name `logs` that consists of two shards, each of which contains two replicas. Shards refer to the servers that contain different parts of the data (in order to read all the data, you must access all the shards). Replicas are duplicating servers (in order to read all the data, you can access the data on any one of the replicas). Cluster names must not contain dots. @@ -198,9 +198,7 @@ The parameters `host`, `port`, and optionally `user`, `password`, `secure`, `com - `secure` - Whether to use a secure SSL/TLS connection. Usually also requires specifying the port (the default secure port is `9440`). The server should listen on `9440` and be configured with correct certificates. - `compression` - Use data compression. Default value: `true`. -When specifying replicas, one of the available replicas will be selected for each of the shards when reading. You can configure the algorithm for load balancing (the preference for which replica to access) – see the [load_balancing](../../../operations/settings/settings.md#settings-load_balancing) setting. -If the connection with the server is not established, there will be an attempt to connect with a short timeout. If the connection failed, the next replica will be selected, and so on for all the replicas. If the connection attempt failed for all the replicas, the attempt will be repeated the same way, several times. -This works in favour of resiliency, but does not provide complete fault tolerance: a remote server might accept the connection, but might not work, or work poorly. +When specifying replicas, one of the available replicas will be selected for each of the shards when reading. You can configure the algorithm for load balancing (the preference for which replica to access) – see the [load_balancing](../../../operations/settings/settings.md#load_balancing) setting. If the connection with the server is not established, there will be an attempt to connect with a short timeout. If the connection failed, the next replica will be selected, and so on for all the replicas. If the connection attempt failed for all the replicas, the attempt will be repeated the same way, several times. This works in favour of resiliency, but does not provide complete fault tolerance: a remote server might accept the connection, but might not work, or work poorly. You can specify just one of the shards (in this case, query processing should be called remote, rather than distributed) or up to any number of shards. 
In each shard, you can specify from one to any number of replicas. You can specify a different number of replicas for each shard. @@ -245,7 +243,7 @@ If the server ceased to exist or had a rough restart (for example, due to a hard When querying a `Distributed` table, `SELECT` queries are sent to all shards and work regardless of how data is distributed across the shards (they can be distributed completely randomly). When you add a new shard, you do not have to transfer old data into it. Instead, you can write new data to it by using a heavier weight – the data will be distributed slightly unevenly, but queries will work correctly and efficiently. -When the `max_parallel_replicas` option is enabled, query processing is parallelized across all replicas within a single shard. For more information, see the section [max_parallel_replicas](../../../operations/settings/settings.md#settings-max_parallel_replicas). +When the `max_parallel_replicas` option is enabled, query processing is parallelized across all replicas within a single shard. For more information, see the section [max_parallel_replicas](../../../operations/settings/settings.md#max_parallel_replicas). To learn more about how distributed `in` and `global in` queries are processed, refer to [this](../../../sql-reference/operators/in.md#select-distributed-subqueries) documentation. diff --git a/docs/en/engines/table-engines/special/file.md b/docs/en/engines/table-engines/special/file.md index 6e3897398a5..fdf5242ba3b 100644 --- a/docs/en/engines/table-engines/special/file.md +++ b/docs/en/engines/table-engines/special/file.md @@ -101,8 +101,8 @@ For partitioning by month, use the `toYYYYMM(date_column)` expression, where `da ## Settings {#settings} -- [engine_file_empty_if_not_exists](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - allows to select empty data from a file that doesn't exist. Disabled by default. +- [engine_file_empty_if_not_exists](/docs/en/operations/settings/settings.md#engine-file-empty_if-not-exists) - allows to select empty data from a file that doesn't exist. Disabled by default. - [engine_file_truncate_on_insert](/docs/en/operations/settings/settings.md#engine-file-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. - [engine_file_allow_create_multiple_files](/docs/en/operations/settings/settings.md#engine_file_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [engine_file_skip_empty_files](/docs/en/operations/settings/settings.md#engine_file_skip_empty_files) - allows to skip empty files while reading. Disabled by default. -- [storage_file_read_method](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - method of reading data from storage file, one of: `read`, `pread`, `mmap`. The mmap method does not apply to clickhouse-server (it's intended for clickhouse-local). Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local. +- [storage_file_read_method](/docs/en/operations/settings/settings.md#engine-file-empty_if-not-exists) - method of reading data from storage file, one of: `read`, `pread`, `mmap`. The mmap method does not apply to clickhouse-server (it's intended for clickhouse-local). Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local. 
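A short sketch of how the settings above behave with the `File` engine; the table name and the chosen format are arbitrary illustrative choices, not values mandated by the engine.

```sql
-- The data is kept as a single file (data.TabSeparated) inside the table's directory.
CREATE TABLE file_engine_table (name String, value UInt32)
    ENGINE = File(TabSeparated);

-- By default, selecting from a table whose file does not exist yet throws an error;
-- this setting makes such a SELECT return an empty result instead.
SET engine_file_empty_if_not_exists = 1;
SELECT * FROM file_engine_table;

-- Truncate the existing file before the insert (disabled by default).
SET engine_file_truncate_on_insert = 1;
INSERT INTO file_engine_table VALUES ('one', 1), ('two', 2);
```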
diff --git a/docs/en/engines/table-engines/special/filelog.md b/docs/en/engines/table-engines/special/filelog.md index eef9a17444e..82201053bc5 100644 --- a/docs/en/engines/table-engines/special/filelog.md +++ b/docs/en/engines/table-engines/special/filelog.md @@ -41,7 +41,7 @@ Optional parameters: - `poll_timeout_ms` - Timeout for single poll from log file. Default: [stream_poll_timeout_ms](../../../operations/settings/settings.md#stream_poll_timeout_ms). - `poll_max_batch_size` — Maximum amount of records to be polled in a single poll. Default: [max_block_size](../../../operations/settings/settings.md#setting-max_block_size). -- `max_block_size` — The maximum batch size (in records) for poll. Default: [max_insert_block_size](../../../operations/settings/settings.md#setting-max_insert_block_size). +- `max_block_size` — The maximum batch size (in records) for poll. Default: [max_insert_block_size](../../../operations/settings/settings.md#max_insert_block_size). - `max_threads` - Number of max threads to parse files, default is 0, which means the number will be max(1, physical_cpu_cores / 4). - `poll_directory_watch_events_backoff_init` - The initial sleep value for watch directory thread. Default: `500`. - `poll_directory_watch_events_backoff_max` - The max sleep value for watch directory thread. Default: `32000`. diff --git a/docs/en/engines/table-engines/special/materializedview.md b/docs/en/engines/table-engines/special/materializedview.md deleted file mode 100644 index d5f3b364d4e..00000000000 --- a/docs/en/engines/table-engines/special/materializedview.md +++ /dev/null @@ -1,9 +0,0 @@ ---- -slug: /en/engines/table-engines/special/materializedview -sidebar_position: 100 -sidebar_label: MaterializedView ---- - -# MaterializedView Table Engine - -Used for implementing materialized views (for more information, see [CREATE VIEW](../../../sql-reference/statements/create/view.md#materialized)). For storing data, it uses a different engine that was specified when creating the view. When reading from a table, it just uses that engine. diff --git a/docs/en/getting-started/example-datasets/youtube-dislikes.md b/docs/en/getting-started/example-datasets/youtube-dislikes.md index e24c6e5a6dc..a6bbb20cc8d 100644 --- a/docs/en/getting-started/example-datasets/youtube-dislikes.md +++ b/docs/en/getting-started/example-datasets/youtube-dislikes.md @@ -25,8 +25,7 @@ The steps below will easily work on a local install of ClickHouse too. The only 1. Let's see what the data looks like. 
The `s3cluster` table function returns a table, so we can `DESCRIBE` the result: ```sql -DESCRIBE s3Cluster( - 'default', +DESCRIBE s3( 'https://clickhouse-public-datasets.s3.amazonaws.com/youtube/original/files/*.zst', 'JSONLines' ); @@ -35,29 +34,29 @@ DESCRIBE s3Cluster( ClickHouse infers the following schema from the JSON file: ```response -┌─name────────────────┬─type─────────────────────────────────┐ -│ id │ Nullable(String) │ -│ fetch_date │ Nullable(Int64) │ -│ upload_date │ Nullable(String) │ -│ title │ Nullable(String) │ -│ uploader_id │ Nullable(String) │ -│ uploader │ Nullable(String) │ -│ uploader_sub_count │ Nullable(Int64) │ -│ is_age_limit │ Nullable(Bool) │ -│ view_count │ Nullable(Int64) │ -│ like_count │ Nullable(Int64) │ -│ dislike_count │ Nullable(Int64) │ -│ is_crawlable │ Nullable(Bool) │ -│ is_live_content │ Nullable(Bool) │ -│ has_subtitles │ Nullable(Bool) │ -│ is_ads_enabled │ Nullable(Bool) │ -│ is_comments_enabled │ Nullable(Bool) │ -│ description │ Nullable(String) │ -│ rich_metadata │ Array(Map(String, Nullable(String))) │ -│ super_titles │ Array(Map(String, Nullable(String))) │ -│ uploader_badges │ Nullable(String) │ -│ video_badges │ Nullable(String) │ -└─────────────────────┴──────────────────────────────────────┘ +┌─name────────────────┬─type───────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┬─default_type─┬─default_expression─┬─comment─┬─codec_expression─┬─ttl_expression─┐ +│ id │ Nullable(String) │ │ │ │ │ │ +│ fetch_date │ Nullable(String) │ │ │ │ │ │ +│ upload_date │ Nullable(String) │ │ │ │ │ │ +│ title │ Nullable(String) │ │ │ │ │ │ +│ uploader_id │ Nullable(String) │ │ │ │ │ │ +│ uploader │ Nullable(String) │ │ │ │ │ │ +│ uploader_sub_count │ Nullable(Int64) │ │ │ │ │ │ +│ is_age_limit │ Nullable(Bool) │ │ │ │ │ │ +│ view_count │ Nullable(Int64) │ │ │ │ │ │ +│ like_count │ Nullable(Int64) │ │ │ │ │ │ +│ dislike_count │ Nullable(Int64) │ │ │ │ │ │ +│ is_crawlable │ Nullable(Bool) │ │ │ │ │ │ +│ is_live_content │ Nullable(Bool) │ │ │ │ │ │ +│ has_subtitles │ Nullable(Bool) │ │ │ │ │ │ +│ is_ads_enabled │ Nullable(Bool) │ │ │ │ │ │ +│ is_comments_enabled │ Nullable(Bool) │ │ │ │ │ │ +│ description │ Nullable(String) │ │ │ │ │ │ +│ rich_metadata │ Array(Tuple(call Nullable(String), content Nullable(String), subtitle Nullable(String), title Nullable(String), url Nullable(String))) │ │ │ │ │ │ +│ super_titles │ Array(Tuple(text Nullable(String), url Nullable(String))) │ │ │ │ │ │ +│ uploader_badges │ Nullable(String) │ │ │ │ │ │ +│ video_badges │ Nullable(String) │ │ │ │ │ │ +└─────────────────────┴────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘ ``` 2. Based on the inferred schema, we cleaned up the data types and added a primary key. Define the following table: @@ -82,13 +81,13 @@ CREATE TABLE youtube `is_ads_enabled` Bool, `is_comments_enabled` Bool, `description` String, - `rich_metadata` Array(Map(String, String)), - `super_titles` Array(Map(String, String)), + `rich_metadata` Array(Tuple(call String, content String, subtitle String, title String, url String)), + `super_titles` Array(Tuple(text String, url String)), `uploader_badges` String, `video_badges` String ) ENGINE = MergeTree -ORDER BY (uploader, upload_date); +ORDER BY (uploader, upload_date) ``` 3. 
The following command streams the records from the S3 files into the `youtube` table. diff --git a/docs/en/getting-started/install.md b/docs/en/getting-started/install.md index 2ea900ba753..e8662ec16fa 100644 --- a/docs/en/getting-started/install.md +++ b/docs/en/getting-started/install.md @@ -81,7 +81,7 @@ It is recommended to use official pre-compiled `deb` packages for Debian or Ubun sudo apt-get install -y apt-transport-https ca-certificates dirmngr GNUPGHOME=$(mktemp -d) sudo GNUPGHOME="$GNUPGHOME" gpg --no-default-keyring --keyring /usr/share/keyrings/clickhouse-keyring.gpg --keyserver hkp://keyserver.ubuntu.com:80 --recv-keys 8919F6BD2B48D754 -sudo rm -r "$GNUPGHOME" +sudo rm -rf "$GNUPGHOME" sudo chmod +r /usr/share/keyrings/clickhouse-keyring.gpg echo "deb [signed-by=/usr/share/keyrings/clickhouse-keyring.gpg] https://packages.clickhouse.com/deb stable main" | sudo tee \ diff --git a/docs/en/interfaces/formats.md b/docs/en/interfaces/formats.md index 57de0555bf6..836b1f2f637 100644 --- a/docs/en/interfaces/formats.md +++ b/docs/en/interfaces/formats.md @@ -478,6 +478,7 @@ The CSV format supports the output of totals and extremes the same way as `TabSe - [input_format_csv_allow_whitespace_or_tab_as_delimiter](/docs/en/operations/settings/settings-formats.md/# input_format_csv_allow_whitespace_or_tab_as_delimiter) - Allow to use whitespace or tab as field delimiter in CSV strings. Default value - `false`. - [input_format_csv_allow_variable_number_of_columns](/docs/en/operations/settings/settings-formats.md/#input_format_csv_allow_variable_number_of_columns) - allow variable number of columns in CSV format, ignore extra columns and use default values on missing columns. Default value - `false`. - [input_format_csv_use_default_on_bad_values](/docs/en/operations/settings/settings-formats.md/#input_format_csv_use_default_on_bad_values) - Allow to set default value to column when CSV field deserialization failed on bad value. Default value - `false`. +- [input_format_csv_try_infer_numbers_from_strings](/docs/en/operations/settings/settings-formats.md/#input_format_csv_try_infer_numbers_from_strings) - Try to infer numbers from string fields while schema inference. Default value - `false`. ## CSVWithNames {#csvwithnames} diff --git a/docs/en/interfaces/http.md b/docs/en/interfaces/http.md index 63f75fb7830..4eeb19cefcf 100644 --- a/docs/en/interfaces/http.md +++ b/docs/en/interfaces/http.md @@ -167,7 +167,7 @@ For successful requests that do not return a data table, an empty response body You can use compression to reduce network traffic when transmitting a large amount of data or for creating dumps that are immediately compressed. -You can use the internal ClickHouse compression format when transmitting data. The compressed data has a non-standard format, and you need `clickhouse-compressor` program to work with it. It is installed with the `clickhouse-client` package. To increase the efficiency of data insertion, you can disable server-side checksum verification by using the [http_native_compression_disable_checksumming_on_decompress](../operations/settings/settings.md#settings-http_native_compression_disable_checksumming_on_decompress) setting. +You can use the internal ClickHouse compression format when transmitting data. The compressed data has a non-standard format, and you need `clickhouse-compressor` program to work with it. It is installed with the `clickhouse-client` package. 
To increase the efficiency of data insertion, you can disable server-side checksum verification by using the [http_native_compression_disable_checksumming_on_decompress](../operations/settings/settings.md#http_native_compression_disable_checksumming_on_decompress) setting. If you specify `compress=1` in the URL, the server will compress the data it sends to you. If you specify `decompress=1` in the URL, the server will decompress the data which you pass in the `POST` method. @@ -183,7 +183,7 @@ You can also choose to use [HTTP compression](https://en.wikipedia.org/wiki/HTTP - `snappy` To send a compressed `POST` request, append the request header `Content-Encoding: compression_method`. -In order for ClickHouse to compress the response, enable compression with [enable_http_compression](../operations/settings/settings.md#settings-enable_http_compression) setting and append `Accept-Encoding: compression_method` header to the request. You can configure the data compression level in the [http_zlib_compression_level](../operations/settings/settings.md#settings-http_zlib_compression_level) setting for all compression methods. +In order for ClickHouse to compress the response, enable compression with [enable_http_compression](../operations/settings/settings.md#enable_http_compression) setting and append `Accept-Encoding: compression_method` header to the request. You can configure the data compression level in the [http_zlib_compression_level](../operations/settings/settings.md#http_zlib_compression_level) setting for all compression methods. :::info Some HTTP clients might decompress data from the server by default (with `gzip` and `deflate`) and you might get decompressed data even if you use the compression settings correctly. @@ -285,7 +285,7 @@ For information about other parameters, see the section “SET”. Similarly, you can use ClickHouse sessions in the HTTP protocol. To do this, you need to add the `session_id` GET parameter to the request. You can use any string as the session ID. By default, the session is terminated after 60 seconds of inactivity. To change this timeout, modify the `default_session_timeout` setting in the server configuration, or add the `session_timeout` GET parameter to the request. To check the session status, use the `session_check=1` parameter. Only one query at a time can be executed within a single session. -You can receive information about the progress of a query in `X-ClickHouse-Progress` response headers. To do this, enable [send_progress_in_http_headers](../operations/settings/settings.md#settings-send_progress_in_http_headers). Example of the header sequence: +You can receive information about the progress of a query in `X-ClickHouse-Progress` response headers. To do this, enable [send_progress_in_http_headers](../operations/settings/settings.md#send_progress_in_http_headers). Example of the header sequence: ``` text X-ClickHouse-Progress: {"read_rows":"2752512","read_bytes":"240570816","total_rows_to_read":"8880128","elapsed_ns":"662334"} @@ -496,7 +496,7 @@ Next are the configuration methods for different `type`. `query` value is a predefined query of `predefined_query_handler`, which is executed by ClickHouse when an HTTP request is matched and the result of the query is returned. It is a must configuration. -The following example defines the values of [max_threads](../operations/settings/settings.md#settings-max_threads) and `max_final_threads` settings, then queries the system table to check whether these settings were set successfully. 
+The following example defines the values of [max_threads](../operations/settings/settings.md#max_threads) and `max_final_threads` settings, then queries the system table to check whether these settings were set successfully. :::note To keep the default `handlers` such as` query`, `play`,` ping`, add the `` rule. @@ -539,7 +539,7 @@ In `dynamic_query_handler`, the query is written in the form of parameter of the ClickHouse extracts and executes the value corresponding to the `query_param_name` value in the URL of the HTTP request. The default value of `query_param_name` is `/query` . It is an optional configuration. If there is no definition in the configuration file, the parameter is not passed in. -To experiment with this functionality, the example defines the values of [max_threads](../operations/settings/settings.md#settings-max_threads) and `max_final_threads` and `queries` whether the settings were set successfully. +To experiment with this functionality, the example defines the values of [max_threads](../operations/settings/settings.md#max_threads) and `max_final_threads` and `queries` whether the settings were set successfully. Example: diff --git a/docs/en/interfaces/overview.md b/docs/en/interfaces/overview.md index e60aff927c4..0e09ab6a0b7 100644 --- a/docs/en/interfaces/overview.md +++ b/docs/en/interfaces/overview.md @@ -25,6 +25,7 @@ ClickHouse server provides embedded visual interfaces for power users: - Play UI: open `/play` in the browser; - Advanced Dashboard: open `/dashboard` in the browser; +- Binary symbols viewer for ClickHouse engineers: open `/binary` in the browser; There are also a wide range of third-party libraries for working with ClickHouse: diff --git a/docs/en/interfaces/schema-inference.md b/docs/en/interfaces/schema-inference.md index 0aadb09730a..ef858796936 100644 --- a/docs/en/interfaces/schema-inference.md +++ b/docs/en/interfaces/schema-inference.md @@ -834,6 +834,27 @@ $$) └──────────────┴───────────────┘ ``` +#### CSV settings {#csv-settings} + +##### input_format_csv_try_infer_numbers_from_strings + +Enabling this setting allows inferring numbers from string values. + +This setting is disabled by default. + +**Example:** + +```sql +SET input_format_json_try_infer_numbers_from_strings = 1; +DESC format(CSV, '"42","42.42"'); +``` +```reponse +┌─name─┬─type──────────────┬─default_type─┬─default_expression─┬─comment─┬─codec_expression─┬─ttl_expression─┐ +│ c1 │ Nullable(Int64) │ │ │ │ │ │ +│ c2 │ Nullable(Float64) │ │ │ │ │ │ +└──────┴───────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘ +``` + ### TSV/TSKV {#tsv-tskv} In TSV/TSKV formats ClickHouse extracts column value from the row according to tabular delimiters and then parses extracted value using @@ -1846,3 +1867,102 @@ DESC format(JSONAsString, '{"x" : 42, "y" : "Hello, World!"}') SETTINGS allow_ex │ json │ Object('json') │ │ │ │ │ │ └──────┴────────────────┴──────────────┴────────────────────┴─────────┴──────────────────┴────────────────┘ ``` + +## Schema inference modes {#schema-inference-modes} + +Schema inference from the set of data files can work in 2 different modes: `default` and `union`. +The mode is controlled by the setting `schema_inference_mode`. + +### Default mode {#default-schema-inference-mode} + +In default mode, ClickHouse assumes that all files have the same schema and tries to infer the schema by reading files one by one until it succeeds. 
+ +Example: + +Let's say we have 3 files `data1.jsonl`, `data2.jsonl` and `data3.jsonl` with the next content: + +`data1.jsonl`: +```json +{"field1" : 1, "field2" : null} +{"field1" : 2, "field2" : null} +{"field1" : 3, "field2" : null} +``` + +`data2.jsonl`: +```json +{"field1" : 4, "field2" : "Data4"} +{"field1" : 5, "field2" : "Data5"} +{"field1" : 6, "field2" : "Data5"} +``` + +`data3.jsonl`: +```json +{"field1" : 7, "field2" : "Data7", "field3" : [1, 2, 3]} +{"field1" : 8, "field2" : "Data8", "field3" : [4, 5, 6]} +{"field1" : 9, "field2" : "Data9", "field3" : [7, 8, 9]} +``` + +Let's try to use schema inference on these 3 files: +```sql +:) DESCRIBE file('data{1,2,3}.jsonl') SETTINGS schema_inference_mode='default' +``` + +Result: +```text +┌─name───┬─type─────────────┐ +│ field1 │ Nullable(Int64) │ +│ field2 │ Nullable(String) │ +└────────┴──────────────────┘ +``` + +As we can see, we don't have `field3` from file `data3.jsonl`. +It happens because ClickHouse first tried to infer schema from file `data1.jsonl`, failed because of only nulls for field `field2`, +and then tried to infer schema from `data2.jsonl` and succeeded, so data from file `data3.jsonl` wasn't read. + +### Union mode {#default-schema-inference-mode} + +In union mode, ClickHouse assumes that files can have different schemas, so it infer schemas of all files and then union them to the common schema. + +Let's say we have 3 files `data1.jsonl`, `data2.jsonl` and `data3.jsonl` with the next content: + +`data1.jsonl`: +```json +{"field1" : 1} +{"field1" : 2} +{"field1" : 3} +``` + +`data2.jsonl`: +```json +{"field2" : "Data4"} +{"field2" : "Data5"} +{"field2" : "Data5"} +``` + +`data3.jsonl`: +```json +{"field3" : [1, 2, 3]} +{"field3" : [4, 5, 6]} +{"field3" : [7, 8, 9]} +``` + +Let's try to use schema inference on these 3 files: +```sql +:) DESCRIBE file('data{1,2,3}.jsonl') SETTINGS schema_inference_mode='union' +``` + +Result: +```text +┌─name───┬─type───────────────────┐ +│ field1 │ Nullable(Int64) │ +│ field2 │ Nullable(String) │ +│ field3 │ Array(Nullable(Int64)) │ +└────────┴────────────────────────┘ +``` + +As we can see, we have all fields from all files. + +Note: +- As some of the files may not contain some columns from the resulting schema, union mode is supported only for formats that support reading subset of columns (like JSONEachRow, Parquet, TSVWithNames, etc) and won't work for other formats (like CSV, TSV, JSONCompactEachRow, etc). +- If ClickHouse cannot infer the schema from one of the files, the exception will be thrown. +- If you have a lot of files, reading schema from all of them can take a lot of time. diff --git a/docs/en/operations/backup.md b/docs/en/operations/backup.md index 6068b185ede..d45885ee816 100644 --- a/docs/en/operations/backup.md +++ b/docs/en/operations/backup.md @@ -406,7 +406,7 @@ RESTORE TABLE data AS data_restored FROM Disk('s3_plain', 'cloud_backup'); :::note But keep in mind that: - This disk should not be used for `MergeTree` itself, only for `BACKUP`/`RESTORE` -- If your tables are backed by S3 storage, it doesn't use `CopyObject` calls to copy parts to the destination bucket, instead, it downloads and uploads them, which is very inefficient. Prefer to use `BACKUP ... TO S3()` syntax for this use-case. +- If your tables are backed by S3 storage and types of the disks are different, it doesn't use `CopyObject` calls to copy parts to the destination bucket, instead, it downloads and uploads them, which is very inefficient. Prefer to use `BACKUP ... 
TO S3()` syntax for this use-case. ::: ## Alternatives diff --git a/docs/en/operations/monitoring.md b/docs/en/operations/monitoring.md index ebf981690a9..de61da6f5c4 100644 --- a/docs/en/operations/monitoring.md +++ b/docs/en/operations/monitoring.md @@ -15,6 +15,27 @@ You can monitor: - Utilization of hardware resources. - ClickHouse server metrics. +## Built-in observability dashboard + +Screenshot 2023-11-12 at 6 08 58 PM + +ClickHouse comes with a built-in observability dashboard feature which can be accessed by `$HOST:$PORT/dashboard` (requires user and password) that shows the following metrics: +- Queries/second +- CPU usage (cores) +- Queries running +- Merges running +- Selected bytes/second +- IO wait +- CPU wait +- OS CPU Usage (userspace) +- OS CPU Usage (kernel) +- Read from disk +- Read from filesystem +- Memory (tracked) +- Inserted rows/second +- Total MergeTree parts +- Max parts for partition + ## Resource Utilization {#resource-utilization} ClickHouse also monitors the state of hardware resources by itself such as: @@ -43,4 +64,4 @@ You can configure ClickHouse to export metrics to [Prometheus](https://prometheu Additionally, you can monitor server availability through the HTTP API. Send the `HTTP GET` request to `/ping`. If the server is available, it responds with `200 OK`. -To monitor servers in a cluster configuration, you should set the [max_replica_delay_for_distributed_queries](../operations/settings/settings.md#settings-max_replica_delay_for_distributed_queries) parameter and use the HTTP resource `/replicas_status`. A request to `/replicas_status` returns `200 OK` if the replica is available and is not delayed behind the other replicas. If a replica is delayed, it returns `503 HTTP_SERVICE_UNAVAILABLE` with information about the gap. +To monitor servers in a cluster configuration, you should set the [max_replica_delay_for_distributed_queries](../operations/settings/settings.md#max_replica_delay_for_distributed_queries) parameter and use the HTTP resource `/replicas_status`. A request to `/replicas_status` returns `200 OK` if the replica is available and is not delayed behind the other replicas. If a replica is delayed, it returns `503 HTTP_SERVICE_UNAVAILABLE` with information about the gap. diff --git a/docs/en/operations/optimizing-performance/sampling-query-profiler.md b/docs/en/operations/optimizing-performance/sampling-query-profiler.md index 206f710734e..194d2714422 100644 --- a/docs/en/operations/optimizing-performance/sampling-query-profiler.md +++ b/docs/en/operations/optimizing-performance/sampling-query-profiler.md @@ -42,7 +42,7 @@ To analyze the `trace_log` system table: - Install the `clickhouse-common-static-dbg` package. See [Install from DEB Packages](../../getting-started/install.md#install-from-deb-packages). -- Allow introspection functions by the [allow_introspection_functions](../../operations/settings/settings.md#settings-allow_introspection_functions) setting. +- Allow introspection functions by the [allow_introspection_functions](../../operations/settings/settings.md#allow_introspection_functions) setting. For security reasons, introspection functions are disabled by default. diff --git a/docs/en/operations/query-cache.md b/docs/en/operations/query-cache.md index def0f48b968..50c5ff4457f 100644 --- a/docs/en/operations/query-cache.md +++ b/docs/en/operations/query-cache.md @@ -29,6 +29,10 @@ Transactionally inconsistent caching is traditionally provided by client tools o the same caching logic and configuration is often duplicated. 
With ClickHouse's query cache, the caching logic moves to the server side. This reduces maintenance effort and avoids redundancy. +:::note +Security consideration: The cached query result is tied to the user executing it. Authorization checks are performed when the query is executed. This means that if there are any alterations to the user's role or permissions between the time the query is cached and when the cache is accessed, the result will not reflect these changes. We recommend using different users to distinguish between different levels of access, instead of actively toggling roles for a single user between queries, as this practice may lead to unexpected query results. +::: + ## Configuration Settings and Usage Setting [use_query_cache](settings/settings.md#use-query-cache) can be used to control whether a specific query or all queries of the @@ -99,7 +103,7 @@ It is also possible to limit the cache usage of individual users using [settings constraints](settings/constraints-on-settings.md). More specifically, you can restrict the maximum amount of memory (in bytes) a user may allocate in the query cache and the maximum number of stored query results. For that, first provide configurations [query_cache_max_size_in_bytes](settings/settings.md#query-cache-max-size-in-bytes) and -[query_cache_max_entries](settings/settings.md#query-cache-size-max-entries) in a user profile in `users.xml`, then make both settings +[query_cache_max_entries](settings/settings.md#query-cache-max-entries) in a user profile in `users.xml`, then make both settings readonly: ``` xml @@ -140,7 +144,7 @@ value can be specified at session, profile or query level using setting [query_c Entries in the query cache are compressed by default. This reduces the overall memory consumption at the cost of slower writes into / reads from the query cache. To disable compression, use setting [query_cache_compress_entries](settings/settings.md#query-cache-compress-entries). -ClickHouse reads table data in blocks of [max_block_size](settings/settings.md#settings-max_block_size) rows. Due to filtering, aggregation, +ClickHouse reads table data in blocks of [max_block_size](settings/settings.md#setting-max_block_size) rows. Due to filtering, aggregation, etc., result blocks are typically much smaller than 'max_block_size' but there are also cases where they are much bigger. Setting [query_cache_squash_partial_results](settings/settings.md#query-cache-squash-partial-results) (enabled by default) controls if result blocks are squashed (if they are tiny) or split (if they are large) into blocks of 'max_block_size' size before insertion into the query result diff --git a/docs/en/operations/server-configuration-parameters/settings.md b/docs/en/operations/server-configuration-parameters/settings.md index cc2692b8e02..48434d992e2 100644 --- a/docs/en/operations/server-configuration-parameters/settings.md +++ b/docs/en/operations/server-configuration-parameters/settings.md @@ -472,6 +472,39 @@ The value 0 means that you can delete all tables without any restrictions. ``` xml 0 ``` + + +## max\_database\_num\_to\_warn {#max-database-num-to-warn} +If the number of attached databases exceeds the specified value, clickhouse server will add warning messages to `system.warnings` table. +Default value: 1000 + +**Example** + +``` xml +50 +``` + +## max\_table\_num\_to\_warn {#max-table-num-to-warn} +If the number of attached tables exceeds the specified value, clickhouse server will add warning messages to `system.warnings` table. 
+Default value: 5000 + +**Example** + +``` xml +400 +``` + + +## max\_part\_num\_to\_warn {#max-part-num-to-warn} +If the number of active parts exceeds the specified value, clickhouse server will add warning messages to `system.warnings` table. +Default value: 100000 + +**Example** + +``` xml +400 +``` + ## max_temporary_data_on_disk_size @@ -1650,7 +1683,7 @@ Default value: `0.5`. Asynchronous loading of databases and tables. -If `true` all non-system databases with `Ordinary`, `Atomic` and `Replicated` engine will be loaded asynchronously after the ClickHouse server start up. See `system.async_loader` table, `tables_loader_background_pool_size` and `tables_loader_foreground_pool_size` server settings. Any query that tries to access a table, that is not yet loaded, will wait for exactly this table to be started up. If load job fails, query will rethrow an error (instead of shutting down the whole server in case of `async_load_databases = false`). The table that is waited for by at least one query will be loaded with higher priority. DDL queries on a database will wait for exactly that database to be started up. +If `true` all non-system databases with `Ordinary`, `Atomic` and `Replicated` engine will be loaded asynchronously after the ClickHouse server start up. See `system.asynchronous_loader` table, `tables_loader_background_pool_size` and `tables_loader_foreground_pool_size` server settings. Any query that tries to access a table, that is not yet loaded, will wait for exactly this table to be started up. If load job fails, query will rethrow an error (instead of shutting down the whole server in case of `async_load_databases = false`). The table that is waited for by at least one query will be loaded with higher priority. DDL queries on a database will wait for exactly that database to be started up. If `false`, all databases are loaded when the server starts. @@ -1976,7 +2009,7 @@ Data for the query cache is allocated in DRAM. If memory is scarce, make sure to ## query_thread_log {#query_thread_log} -Setting for logging threads of queries received with the [log_query_threads=1](../../operations/settings/settings.md#settings-log-query-threads) setting. +Setting for logging threads of queries received with the [log_query_threads=1](../../operations/settings/settings.md#log-query-threads) setting. Queries are logged in the [system.query_thread_log](../../operations/system-tables/query_thread_log.md#system_tables-query_thread_log) table, not in a separate file. You can change the name of the table in the `table` parameter (see below). @@ -2018,7 +2051,7 @@ If the table does not exist, ClickHouse will create it. If the structure of the ## query_views_log {#query_views_log} -Setting for logging views (live, materialized etc) dependant of queries received with the [log_query_views=1](../../operations/settings/settings.md#settings-log-query-views) setting. +Setting for logging views (live, materialized etc) dependant of queries received with the [log_query_views=1](../../operations/settings/settings.md#log-query-views) setting. Queries are logged in the [system.query_views_log](../../operations/system-tables/query_views_log.md#system_tables-query_views_log) table, not in a separate file. You can change the name of the table in the `table` parameter (see below). 
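
As an editorial aside, a minimal sketch of how the logged view information can be inspected once `log_query_views` is enabled (the inserted table is hypothetical; the column names follow the `system.query_views_log` documentation and are an assumption here, not part of the original patch):

```sql
-- Enable view logging for the current session, run a query that touches a
-- dependent (materialized) view, then flush and inspect the log.
SET log_query_views = 1;
INSERT INTO source_table VALUES (1);  -- hypothetical table with a dependent materialized view
SYSTEM FLUSH LOGS;
SELECT view_name, view_type, status
FROM system.query_views_log
ORDER BY event_time DESC
LIMIT 5;
```
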
@@ -2298,7 +2331,7 @@ For the value of the `incl` attribute, see the section “[Configuration files]( **See Also** -- [skip_unavailable_shards](../../operations/settings/settings.md#settings-skip_unavailable_shards) +- [skip_unavailable_shards](../../operations/settings/settings.md#skip_unavailable_shards) - [Cluster Discovery](../../operations/cluster-discovery.md) - [Replicated database engine](../../engines/database-engines/replicated.md) diff --git a/docs/en/operations/settings/query-complexity.md b/docs/en/operations/settings/query-complexity.md index 9e36aa26946..1cb7ec9dced 100644 --- a/docs/en/operations/settings/query-complexity.md +++ b/docs/en/operations/settings/query-complexity.md @@ -139,7 +139,7 @@ Limit on the number of bytes in the result. The same as the previous setting. What to do if the volume of the result exceeds one of the limits: ‘throw’ or ‘break’. By default, throw. -Using ‘break’ is similar to using LIMIT. `Break` interrupts execution only at the block level. This means that amount of returned rows is greater than [max_result_rows](#setting-max_result_rows), multiple of [max_block_size](../../operations/settings/settings.md#setting-max_block_size) and depends on [max_threads](../../operations/settings/settings.md#settings-max_threads). +Using ‘break’ is similar to using LIMIT. `Break` interrupts execution only at the block level. This means that amount of returned rows is greater than [max_result_rows](#setting-max_result_rows), multiple of [max_block_size](../../operations/settings/settings.md#setting-max_block_size) and depends on [max_threads](../../operations/settings/settings.md#max_threads). Example: diff --git a/docs/en/operations/settings/settings-formats.md b/docs/en/operations/settings/settings-formats.md index 344e6dda680..3d76bd9df73 100644 --- a/docs/en/operations/settings/settings-formats.md +++ b/docs/en/operations/settings/settings-formats.md @@ -1130,6 +1130,13 @@ Result a 0 1971-01-01 ``` +## input_format_csv_try_infer_numbers_from_strings {#input_format_csv_try_infer_numbers_from_strings} + +If enabled, during schema inference ClickHouse will try to infer numbers from string fields. +It can be useful if CSV data contains quoted UInt64 numbers. + +Disabled by default. + ## Values format settings {#values-format-settings} ### input_format_values_interpret_expressions {#input_format_values_interpret_expressions} diff --git a/docs/en/operations/settings/settings-users.md b/docs/en/operations/settings/settings-users.md index 1f41eafd02e..96477f777a9 100644 --- a/docs/en/operations/settings/settings-users.md +++ b/docs/en/operations/settings/settings-users.md @@ -4,7 +4,7 @@ sidebar_position: 63 sidebar_label: User Settings --- -# User Settings +# Users and Roles Settings The `users` section of the `user.xml` configuration file contains user settings. @@ -187,3 +187,34 @@ The following configuration forces that user `user1` can only see the rows of `t ``` The `filter` can be any expression resulting in a [UInt8](../../sql-reference/data-types/int-uint.md)-type value. It usually contains comparisons and logical operators. Rows from `database_name.table1` where filter results to 0 are not returned for this user. The filtering is incompatible with `PREWHERE` operations and disables `WHERE→PREWHERE` optimization. + +## Roles + +You can create any predefined roles using the `roles` section of the `user.xml` configuration file. 
+ +Structure of the `roles` section: + +```xml + + + + GRANT SHOW ON *.* + REVOKE SHOW ON system.* + GRANT CREATE ON *.* WITH GRANT OPTION + + + +``` + +These roles can also be granted to users from the `users` section: + +```xml + + + ... + + GRANT test_role + + + +``` diff --git a/docs/en/operations/settings/settings.md b/docs/en/operations/settings/settings.md index c8d54d76704..6e087467bb9 100644 --- a/docs/en/operations/settings/settings.md +++ b/docs/en/operations/settings/settings.md @@ -460,6 +460,12 @@ Possible values: Default value: 1048576. +## http_make_head_request {#http-make-head-request} + +The `http_make_head_request` setting allows the execution of a `HEAD` request while reading data from HTTP to retrieve information about the file to be read, such as its size. Since it's enabled by default, it may be desirable to disable this setting in cases where the server does not support `HEAD` requests. + +Default value: `true`. + ## table_function_remote_max_addresses {#table_function_remote_max_addresses} Sets the maximum number of addresses generated from patterns for the [remote](../../sql-reference/table-functions/remote.md) function. @@ -1578,9 +1584,15 @@ Default value: `default`. ## allow_experimental_parallel_reading_from_replicas -If true, ClickHouse will send a SELECT query to all replicas of a table (up to `max_parallel_replicas`) . It will work for any kind of MergeTree table. +Enables or disables sending SELECT queries to all replicas of a table (up to `max_parallel_replicas`). Reading is parallelized and coordinated dynamically. It will work for any kind of MergeTree table. -Default value: `false`. +Possible values: + +- 0 - Disabled. +- 1 - Enabled, silently disabled in case of failure. +- 2 - Enabled, throws an exception in case of failure. + +Default value: `0`. ## compile_expressions {#compile-expressions} @@ -1704,7 +1716,7 @@ Default value: `1` ## query_cache_squash_partial_results {#query-cache-squash-partial-results} -Squash partial result blocks to blocks of size [max_block_size](#setting-max_block_size). Reduces performance of inserts into the [query cache](../query-cache.md) but improves the compressability of cache entries (see [query_cache_compress-entries](#query_cache_compress_entries)). +Squash partial result blocks to blocks of size [max_block_size](#setting-max_block_size). Reduces performance of inserts into the [query cache](../query-cache.md) but improves the compressability of cache entries (see [query_cache_compress-entries](#query-cache-compress-entries)). Possible values: @@ -2474,7 +2486,7 @@ See also: - [load_balancing](#load_balancing-round_robin) - [Table engine Distributed](../../engines/table-engines/special/distributed.md) - [distributed_replica_error_cap](#distributed_replica_error_cap) -- [distributed_replica_error_half_life](#settings-distributed_replica_error_half_life) +- [distributed_replica_error_half_life](#distributed_replica_error_half_life) ## distributed_background_insert_sleep_time_ms {#distributed_background_insert_sleep_time_ms} @@ -2647,7 +2659,7 @@ Default value: 0. ## input_format_parallel_parsing {#input-format-parallel-parsing} -Enables or disables order-preserving parallel parsing of data formats. Supported only for [TSV](../../interfaces/formats.md/#tabseparated), [TKSV](../../interfaces/formats.md/#tskv), [CSV](../../interfaces/formats.md/#csv) and [JSONEachRow](../../interfaces/formats.md/#jsoneachrow) formats. +Enables or disables order-preserving parallel parsing of data formats. 
Supported only for [TSV](../../interfaces/formats.md/#tabseparated), [TSKV](../../interfaces/formats.md/#tskv), [CSV](../../interfaces/formats.md/#csv) and [JSONEachRow](../../interfaces/formats.md/#jsoneachrow) formats. Possible values: @@ -2658,7 +2670,7 @@ Default value: `1`. ## output_format_parallel_formatting {#output-format-parallel-formatting} -Enables or disables parallel formatting of data formats. Supported only for [TSV](../../interfaces/formats.md/#tabseparated), [TKSV](../../interfaces/formats.md/#tskv), [CSV](../../interfaces/formats.md/#csv) and [JSONEachRow](../../interfaces/formats.md/#jsoneachrow) formats. +Enables or disables parallel formatting of data formats. Supported only for [TSV](../../interfaces/formats.md/#tabseparated), [TSKV](../../interfaces/formats.md/#tskv), [CSV](../../interfaces/formats.md/#csv) and [JSONEachRow](../../interfaces/formats.md/#jsoneachrow) formats. Possible values: @@ -4152,6 +4164,41 @@ Result: └─────┴─────┴───────┘ ``` +## enable_order_by_all {#enable-order-by-all} + +Enables or disables sorting by `ALL` columns, i.e. [ORDER BY](../../sql-reference/statements/select/order-by.md) + +Possible values: + +- 0 — Disable ORDER BY ALL. +- 1 — Enable ORDER BY ALL. + +Default value: `1`. + +**Example** + +Query: + +```sql +CREATE TABLE TAB(C1 Int, C2 Int, ALL Int) ENGINE=Memory(); + +INSERT INTO TAB VALUES (10, 20, 30), (20, 20, 10), (30, 10, 20); + +SELECT * FROM TAB ORDER BY ALL; -- returns an error that ALL is ambiguous + +SELECT * FROM TAB ORDER BY ALL SETTINGS enable_order_by_all; +``` + +Result: + +```text +┌─C1─┬─C2─┬─ALL─┐ +│ 20 │ 20 │ 10 │ +│ 30 │ 10 │ 20 │ +│ 10 │ 20 │ 30 │ +└────┴────┴─────┘ +``` + ## splitby_max_substrings_includes_remaining_string {#splitby_max_substrings_includes_remaining_string} Controls whether function [splitBy*()](../../sql-reference/functions/splitting-merging-functions.md) with argument `max_substrings` > 0 will include the remaining string in the last element of the result array. @@ -4349,6 +4396,8 @@ Default value: `1GiB`. ## Schema Inference settings +See [schema inference](../../interfaces/schema-inference.md#schema-inference-modes) documentation for more details. + ### schema_inference_use_cache_for_file {schema_inference_use_cache_for_file} Enable schemas cache for schema inference in `file` table function. @@ -4390,6 +4439,13 @@ Possible values: Default value: 2. +### schema_inference_mode {schema_inference_mode} + +The mode of schema inference. Possible values: `default` and `union`. +See [schema inference modes](../../interfaces/schema-inference.md#schema-inference-modes) section for more details. + +Default value: `default`. + ## compatibility {#compatibility} The `compatibility` setting causes ClickHouse to use the default settings of a previous version of ClickHouse, where the previous version is provided as the setting. @@ -4659,7 +4715,7 @@ Possible values: Default value: `false`. -## rename_files_after_processing +## rename_files_after_processing {#rename_files_after_processing} - **Type:** String @@ -5078,3 +5134,25 @@ When set to `true` than for all s3 requests first two attempts are made with low When set to `false` than all attempts are made with identical timeouts. Default value: `true`. + +## max_partition_size_to_drop + +Restriction on dropping partitions in query time. + +Default value: 50 GB. +The value 0 means that you can drop partitions without any restrictions. 
+ +:::note +This query setting overwrites its server setting equivalent, see [max_partition_size_to_drop](/docs/en/operations/server-configuration-parameters/settings.md/#max-partition-size-to-drop) +::: + +## max_table_size_to_drop + +Restriction on deleting tables in query time. + +Default value: 50 GB. +The value 0 means that you can delete all tables without any restrictions. + +:::note +This query setting overwrites its server setting equivalent, see [max_table_size_to_drop](/docs/en/operations/server-configuration-parameters/settings.md/#max-table-size-to-drop) +::: \ No newline at end of file diff --git a/docs/en/operations/storing-data.md b/docs/en/operations/storing-data.md index 796f65a9d30..b3ef1128c42 100644 --- a/docs/en/operations/storing-data.md +++ b/docs/en/operations/storing-data.md @@ -196,7 +196,7 @@ These settings should be defined in the disk configuration section. - `max_elements` - a limit for a number of cache files. Default: `10000000`. -- `load_metadata_threads` - number of threads being used to load cache metadata on starting time. Default: `1`. +- `load_metadata_threads` - number of threads being used to load cache metadata on starting time. Default: `16`. File Cache **query/profile settings**: diff --git a/docs/en/operations/system-tables/asynchronous_insert_log.md b/docs/en/operations/system-tables/asynchronous_insert_log.md index c3aaa8e6c41..d5f6ab07b10 100644 --- a/docs/en/operations/system-tables/asynchronous_insert_log.md +++ b/docs/en/operations/system-tables/asynchronous_insert_log.md @@ -13,6 +13,7 @@ ClickHouse does not delete data from the table automatically. See [Introduction] Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the async insert happened. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the async insert finished execution. - `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — The date and time when the async insert finished execution with microseconds precision. @@ -42,6 +43,7 @@ SELECT * FROM system.asynchronous_insert_log LIMIT 1 \G; Result: ``` text +hostname: clickhouse.eu-central1.internal event_date: 2023-06-08 event_time: 2023-06-08 10:08:53 event_time_microseconds: 2023-06-08 10:08:53.199516 diff --git a/docs/en/operations/system-tables/async_loader.md b/docs/en/operations/system-tables/asynchronous_loader.md similarity index 97% rename from docs/en/operations/system-tables/async_loader.md rename to docs/en/operations/system-tables/asynchronous_loader.md index 4e8651a6d3e..af9aa4ecd09 100644 --- a/docs/en/operations/system-tables/async_loader.md +++ b/docs/en/operations/system-tables/asynchronous_loader.md @@ -1,7 +1,7 @@ --- -slug: /en/operations/system-tables/async_loader +slug: /en/operations/system-tables/asynchronous_loader --- -# async_loader +# asynchronous_loader Contains information and status for recent asynchronous jobs (e.g. for tables loading). The table contains a row for every job. There is a tool for visualizing information from this table `utils/async_loader_graph`. 
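
Besides the single-row example shown in the next hunk, a summary query over this table can be sketched roughly as follows (the `pool` and `status` column names are assumptions about the table layout, not confirmed by the patch):

```sql
-- Rough overview of asynchronous load jobs grouped by pool and status.
SELECT pool, status, count() AS jobs
FROM system.asynchronous_loader
GROUP BY pool, status
ORDER BY pool, status;
```
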
@@ -9,7 +9,7 @@ Example: ``` sql SELECT * -FROM system.async_loader +FROM system.asynchronous_loader FORMAT Vertical LIMIT 1 ``` diff --git a/docs/en/operations/system-tables/asynchronous_metric_log.md b/docs/en/operations/system-tables/asynchronous_metric_log.md index efe57a202d8..65b2e349707 100644 --- a/docs/en/operations/system-tables/asynchronous_metric_log.md +++ b/docs/en/operations/system-tables/asynchronous_metric_log.md @@ -7,6 +7,7 @@ Contains the historical values for `system.asynchronous_metrics`, which are save Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — Event date. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Event time. - `name` ([String](../../sql-reference/data-types/string.md)) — Metric name. @@ -15,22 +16,33 @@ Columns: **Example** ``` sql -SELECT * FROM system.asynchronous_metric_log LIMIT 10 +SELECT * FROM system.asynchronous_metric_log LIMIT 3 \G ``` ``` text -┌─event_date─┬──────────event_time─┬─name─────────────────────────────────────┬─────value─┐ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ CPUFrequencyMHz_0 │ 2120.9 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.arenas.all.pmuzzy │ 743 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.arenas.all.pdirty │ 26288 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.background_thread.run_intervals │ 0 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.background_thread.num_runs │ 0 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.retained │ 60694528 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.mapped │ 303161344 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.resident │ 260931584 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.metadata │ 12079488 │ -│ 2020-09-05 │ 2020-09-05 15:56:30 │ jemalloc.allocated │ 133756128 │ -└────────────┴─────────────────────┴──────────────────────────────────────────┴───────────┘ +Row 1: +────── +hostname: clickhouse.eu-central1.internal +event_date: 2023-11-14 +event_time: 2023-11-14 14:39:07 +metric: AsynchronousHeavyMetricsCalculationTimeSpent +value: 0.001 + +Row 2: +────── +hostname: clickhouse.eu-central1.internal +event_date: 2023-11-14 +event_time: 2023-11-14 14:39:08 +metric: AsynchronousHeavyMetricsCalculationTimeSpent +value: 0 + +Row 3: +────── +hostname: clickhouse.eu-central1.internal +event_date: 2023-11-14 +event_time: 2023-11-14 14:39:09 +metric: AsynchronousHeavyMetricsCalculationTimeSpent +value: 0 ``` **See Also** diff --git a/docs/en/operations/system-tables/asynchronous_metrics.md b/docs/en/operations/system-tables/asynchronous_metrics.md index e46b495239c..fe8f963b1ec 100644 --- a/docs/en/operations/system-tables/asynchronous_metrics.md +++ b/docs/en/operations/system-tables/asynchronous_metrics.md @@ -239,6 +239,10 @@ The amount of virtual memory mapped for the pages of machine code of the server The amount of virtual memory mapped for the use of stack and for the allocated memory, in bytes. It is unspecified whether it includes the per-thread stacks and most of the allocated memory, that is allocated with the 'mmap' system call. This metric exists only for completeness reasons. I recommend to use the `MemoryResident` metric for monitoring. +### MemoryResidentMax + +Maximum amount of physical memory used by the server process, in bytes. + ### MemoryResident The amount of physical memory used by the server process, in bytes. 
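
Both of the memory metrics described above are exposed through `system.asynchronous_metrics`; as a quick illustration (a sketch, not part of the original page):

```sql
-- Compare the current resident memory with the maximum observed since startup.
SELECT metric, formatReadableSize(value) AS size
FROM system.asynchronous_metrics
WHERE metric IN ('MemoryResident', 'MemoryResidentMax');
```
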
@@ -547,6 +551,14 @@ Total amount of bytes (compressed, including data and indices) stored in all tab Total amount of data parts in all tables of MergeTree family. Numbers larger than 10 000 will negatively affect the server startup time and it may indicate unreasonable choice of the partition key. +### TotalPrimaryKeyBytesInMemory + +The total amount of memory (in bytes) used by primary key values (only takes active parts into account). + +### TotalPrimaryKeyBytesInMemoryAllocated + +The total amount of memory (in bytes) reserved for primary key values (only takes active parts into account). + ### TotalRowsOfMergeTreeTables Total amount of rows (records) stored in all tables of MergeTree family. diff --git a/docs/en/operations/system-tables/backup_log.md b/docs/en/operations/system-tables/backup_log.md index 7e088fcad94..c73fd26683e 100644 --- a/docs/en/operations/system-tables/backup_log.md +++ b/docs/en/operations/system-tables/backup_log.md @@ -7,6 +7,7 @@ Contains logging entries with the information about `BACKUP` and `RESTORE` opera Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — Date of the entry. - `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — Time of the entry with microseconds precision. - `id` ([String](../../sql-reference/data-types/string.md)) — Identifier of the backup or restore operation. @@ -45,6 +46,7 @@ SELECT * FROM system.backup_log WHERE id = 'e5b74ecb-f6f1-426a-80be-872f90043885 ```response Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2023-08-19 event_time_microseconds: 2023-08-19 11:05:21.998566 id: e5b74ecb-f6f1-426a-80be-872f90043885 @@ -63,6 +65,7 @@ bytes_read: 0 Row 2: ────── +hostname: clickhouse.eu-central1.internal event_date: 2023-08-19 event_time_microseconds: 2023-08-19 11:08:56.916192 id: e5b74ecb-f6f1-426a-80be-872f90043885 @@ -93,6 +96,7 @@ SELECT * FROM system.backup_log WHERE id = 'cdf1f731-52ef-42da-bc65-2e1bfcd4ce90 ```response Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2023-08-19 event_time_microseconds: 2023-08-19 11:09:19.718077 id: cdf1f731-52ef-42da-bc65-2e1bfcd4ce90 @@ -111,6 +115,7 @@ bytes_read: 0 Row 2: ────── +hostname: clickhouse.eu-central1.internal event_date: 2023-08-19 event_time_microseconds: 2023-08-19 11:09:29.334234 id: cdf1f731-52ef-42da-bc65-2e1bfcd4ce90 diff --git a/docs/en/operations/system-tables/clusters.md b/docs/en/operations/system-tables/clusters.md index 2659f80e338..63cc083e4bc 100644 --- a/docs/en/operations/system-tables/clusters.md +++ b/docs/en/operations/system-tables/clusters.md @@ -78,5 +78,5 @@ is_active: NULL **See Also** - [Table engine Distributed](../../engines/table-engines/special/distributed.md) -- [distributed_replica_error_cap setting](../../operations/settings/settings.md#settings-distributed_replica_error_cap) -- [distributed_replica_error_half_life setting](../../operations/settings/settings.md#settings-distributed_replica_error_half_life) +- [distributed_replica_error_cap setting](../../operations/settings/settings.md#distributed_replica_error_cap) +- [distributed_replica_error_half_life setting](../../operations/settings/settings.md#distributed_replica_error_half_life) diff --git a/docs/en/operations/system-tables/crash-log.md b/docs/en/operations/system-tables/crash-log.md index 4d015a513a2..e83da3624b2 100644 --- 
a/docs/en/operations/system-tables/crash-log.md +++ b/docs/en/operations/system-tables/crash-log.md @@ -7,6 +7,7 @@ Contains information about stack traces for fatal errors. The table does not exi Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([DateTime](../../sql-reference/data-types/datetime.md)) — Date of the event. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Time of the event. - `timestamp_ns` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Timestamp of the event with nanoseconds. @@ -32,6 +33,7 @@ Result (not full): ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2020-10-14 event_time: 2020-10-14 15:47:40 timestamp_ns: 1602679660271312710 diff --git a/docs/en/operations/system-tables/database_engines.md b/docs/en/operations/system-tables/database_engines.md new file mode 100644 index 00000000000..09f0687af65 --- /dev/null +++ b/docs/en/operations/system-tables/database_engines.md @@ -0,0 +1,26 @@ +--- +slug: /en/operations/system-tables/database_engines +--- +# database_engines + +Contains the list of database engines supported by the server. + +This table contains the following columns (the column type is shown in brackets): + +- `name` (String) — The name of database engine. + +Example: + +``` sql +SELECT * +FROM system.database_engines +WHERE name in ('Atomic', 'Lazy', 'Ordinary') +``` + +``` text +┌─name─────┐ +│ Ordinary │ +│ Atomic │ +│ Lazy │ +└──────────┘ +``` diff --git a/docs/en/operations/system-tables/errors.md b/docs/en/operations/system-tables/errors.md index 01762962152..4582ea631b3 100644 --- a/docs/en/operations/system-tables/errors.md +++ b/docs/en/operations/system-tables/errors.md @@ -9,11 +9,15 @@ Columns: - `name` ([String](../../sql-reference/data-types/string.md)) — name of the error (`errorCodeToName`). - `code` ([Int32](../../sql-reference/data-types/int-uint.md)) — code number of the error. -- `value` ([UInt64](../../sql-reference/data-types/int-uint.md)) — the number of times this error has been happened. -- `last_error_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — time when the last error happened. +- `value` ([UInt64](../../sql-reference/data-types/int-uint.md)) — the number of times this error happened. +- `last_error_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — the time when the last error happened. - `last_error_message` ([String](../../sql-reference/data-types/string.md)) — message for the last error. -- `last_error_trace` ([Array(UInt64)](../../sql-reference/data-types/array.md)) — A [stack trace](https://en.wikipedia.org/wiki/Stack_trace) which represents a list of physical addresses where the called methods are stored. -- `remote` ([UInt8](../../sql-reference/data-types/int-uint.md)) — remote exception (i.e. received during one of the distributed query). +- `last_error_trace` ([Array(UInt64)](../../sql-reference/data-types/array.md)) — A [stack trace](https://en.wikipedia.org/wiki/Stack_trace) that represents a list of physical addresses where the called methods are stored. +- `remote` ([UInt8](../../sql-reference/data-types/int-uint.md)) — remote exception (i.e. received during one of the distributed queries). + +:::note +Counters for some errors may increase during successful query execution. It's not recommended to use this table for server monitoring purposes unless you are sure that corresponding error can not be a false positive. 
+::: **Example** diff --git a/docs/en/operations/system-tables/metric_log.md b/docs/en/operations/system-tables/metric_log.md index 9ea0dde3f80..f0b717a3bbf 100644 --- a/docs/en/operations/system-tables/metric_log.md +++ b/docs/en/operations/system-tables/metric_log.md @@ -6,6 +6,7 @@ slug: /en/operations/system-tables/metric_log Contains history of metrics values from tables `system.metrics` and `system.events`, periodically flushed to disk. Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — Event date. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Event time. - `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — Event time with microseconds resolution. @@ -19,6 +20,7 @@ SELECT * FROM system.metric_log LIMIT 1 FORMAT Vertical; ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2020-09-05 event_time: 2020-09-05 16:22:33 event_time_microseconds: 2020-09-05 16:22:33.196807 diff --git a/docs/en/operations/system-tables/opentelemetry_span_log.md b/docs/en/operations/system-tables/opentelemetry_span_log.md index a605a46c14c..5f03c2f8ada 100644 --- a/docs/en/operations/system-tables/opentelemetry_span_log.md +++ b/docs/en/operations/system-tables/opentelemetry_span_log.md @@ -8,28 +8,19 @@ Contains information about [trace spans](https://opentracing.io/docs/overview/sp Columns: - `trace_id` ([UUID](../../sql-reference/data-types/uuid.md)) — ID of the trace for executed query. - - `span_id` ([UInt64](../../sql-reference/data-types/int-uint.md)) — ID of the `trace span`. - - `parent_span_id` ([UInt64](../../sql-reference/data-types/int-uint.md)) — ID of the parent `trace span`. - - `operation_name` ([String](../../sql-reference/data-types/string.md)) — The name of the operation. - - `kind` ([Enum8](../../sql-reference/data-types/enum.md)) — The [SpanKind](https://opentelemetry.io/docs/reference/specification/trace/api/#spankind) of the span. - `INTERNAL` — Indicates that the span represents an internal operation within an application. - `SERVER` — Indicates that the span covers server-side handling of a synchronous RPC or other remote request. - `CLIENT` — Indicates that the span describes a request to some remote service. - `PRODUCER` — Indicates that the span describes the initiators of an asynchronous request. This parent span will often end before the corresponding child CONSUMER span, possibly even before the child span starts. - `CONSUMER` - Indicates that the span describes a child of an asynchronous PRODUCER request. - - `start_time_us` ([UInt64](../../sql-reference/data-types/int-uint.md)) — The start time of the `trace span` (in microseconds). - - `finish_time_us` ([UInt64](../../sql-reference/data-types/int-uint.md)) — The finish time of the `trace span` (in microseconds). - - `finish_date` ([Date](../../sql-reference/data-types/date.md)) — The finish date of the `trace span`. - - `attribute.names` ([Array](../../sql-reference/data-types/array.md)([String](../../sql-reference/data-types/string.md))) — [Attribute](https://opentelemetry.io/docs/go/instrumentation/#attributes) names depending on the `trace span`. They are filled in according to the recommendations in the [OpenTelemetry](https://opentelemetry.io/) standard. 
- - `attribute.values` ([Array](../../sql-reference/data-types/array.md)([String](../../sql-reference/data-types/string.md))) — Attribute values depending on the `trace span`. They are filled in according to the recommendations in the `OpenTelemetry` standard. **Example** diff --git a/docs/en/operations/system-tables/part_log.md b/docs/en/operations/system-tables/part_log.md index b9185434e01..af582646653 100644 --- a/docs/en/operations/system-tables/part_log.md +++ b/docs/en/operations/system-tables/part_log.md @@ -9,6 +9,7 @@ This table contains information about events that occurred with [data parts](../ The `system.part_log` table contains the following columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `query_id` ([String](../../sql-reference/data-types/string.md)) — Identifier of the `INSERT` query that created this data part. - `event_type` ([Enum8](../../sql-reference/data-types/enum.md)) — Type of the event that occurred with the data part. Can have one of the following values: - `NewPart` — Inserting of a new data part. @@ -56,13 +57,14 @@ SELECT * FROM system.part_log LIMIT 1 FORMAT Vertical; ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal query_id: 983ad9c7-28d5-4ae1-844e-603116b7de31 event_type: NewPart merge_reason: NotAMerge merge_algorithm: Undecided event_date: 2021-02-02 event_time: 2021-02-02 11:14:28 -event_time_microseconds: 2021-02-02 11:14:28.861919 +event_time_microseconds: 2021-02-02 11:14:28.861919 duration_ms: 35 database: default table: log_mt_2 diff --git a/docs/en/operations/system-tables/processors_profile_log.md b/docs/en/operations/system-tables/processors_profile_log.md index 5eedb5a5dae..3c2a090efe3 100644 --- a/docs/en/operations/system-tables/processors_profile_log.md +++ b/docs/en/operations/system-tables/processors_profile_log.md @@ -4,6 +4,7 @@ This table contains profiling on processors level (that you can find in [`EXPLAI Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the event happened. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the event happened. - `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — The date and time with microseconds precision when the event happened. diff --git a/docs/en/operations/system-tables/query_log.md b/docs/en/operations/system-tables/query_log.md index ced97166702..7fcc4928355 100644 --- a/docs/en/operations/system-tables/query_log.md +++ b/docs/en/operations/system-tables/query_log.md @@ -11,7 +11,7 @@ This table does not contain the ingested data for `INSERT` queries. You can change settings of queries logging in the [query_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query-log) section of the server configuration. -You can disable queries logging by setting [log_queries = 0](../../operations/settings/settings.md#settings-log-queries). We do not recommend to turn off logging because information in this table is important for solving issues. +You can disable queries logging by setting [log_queries = 0](../../operations/settings/settings.md#log-queries). We do not recommend to turn off logging because information in this table is important for solving issues. 
The flushing period of data is set in `flush_interval_milliseconds` parameter of the [query_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query-log) server settings section. To force flushing, use the [SYSTEM FLUSH LOGS](../../sql-reference/statements/system.md#query_language-system-flush_logs) query. @@ -30,10 +30,11 @@ Each query creates one or two rows in the `query_log` table, depending on the st You can use the [log_queries_probability](../../operations/settings/settings.md#log-queries-probability) setting to reduce the number of queries, registered in the `query_log` table. -You can use the [log_formatted_queries](../../operations/settings/settings.md#settings-log-formatted-queries) setting to log formatted queries to the `formatted_query` column. +You can use the [log_formatted_queries](../../operations/settings/settings.md#log-formatted-queries) setting to log formatted queries to the `formatted_query` column. Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `type` ([Enum8](../../sql-reference/data-types/enum.md)) — Type of an event that occurred when executing the query. Values: - `'QueryStart' = 1` — Successful start of query execution. - `'QueryFinish' = 2` — Successful end of query execution. @@ -100,7 +101,7 @@ Columns: - `revision` ([UInt32](../../sql-reference/data-types/int-uint.md)) — ClickHouse revision. - `ProfileEvents` ([Map(String, UInt64)](../../sql-reference/data-types/map.md)) — ProfileEvents that measure different metrics. The description of them could be found in the table [system.events](../../operations/system-tables/events.md#system_tables-events) - `Settings` ([Map(String, String)](../../sql-reference/data-types/map.md)) — Settings that were changed when the client ran the query. To enable logging changes to settings, set the `log_query_settings` parameter to 1. -- `log_comment` ([String](../../sql-reference/data-types/string.md)) — Log comment. It can be set to arbitrary string no longer than [max_query_size](../../operations/settings/settings.md#settings-max_query_size). An empty string if it is not defined. +- `log_comment` ([String](../../sql-reference/data-types/string.md)) — Log comment. It can be set to arbitrary string no longer than [max_query_size](../../operations/settings/settings.md#max_query_size). An empty string if it is not defined. - `thread_ids` ([Array(UInt64)](../../sql-reference/data-types/array.md)) — Thread ids that are participating in query execution. These threads may not have run simultaneously. - `peak_threads_usage` ([UInt64)](../../sql-reference/data-types/int-uint.md)) — Maximum count of simultaneous threads executing the query. - `used_aggregate_functions` ([Array(String)](../../sql-reference/data-types/array.md)) — Canonical names of `aggregate functions`, which were used during query execution. 
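
As a side note to the `log_comment` column described above, a common pattern is to tag a query with a comment and then locate it in the log; a minimal sketch (the comment string is arbitrary):

```sql
-- Tag a query, flush the logs, then find it in query_log by its comment.
SELECT 1 SETTINGS log_comment = 'docs-example';
SYSTEM FLUSH LOGS;
SELECT event_time, query_duration_ms, query
FROM system.query_log
WHERE log_comment = 'docs-example' AND type = 'QueryFinish'
ORDER BY event_time DESC
LIMIT 1;
```
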
@@ -127,6 +128,7 @@ SELECT * FROM system.query_log WHERE type = 'QueryFinish' ORDER BY query_start_t ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal type: QueryFinish event_date: 2021-11-03 event_time: 2021-11-03 16:13:54 @@ -167,7 +169,7 @@ initial_query_start_time: 2021-11-03 16:13:54 initial_query_start_time_microseconds: 2021-11-03 16:13:54.952325 interface: 1 os_user: sevirov -client_hostname: clickhouse.ru-central1.internal +client_hostname: clickhouse.eu-central1.internal client_name: ClickHouse client_revision: 54449 client_version_major: 21 diff --git a/docs/en/operations/system-tables/query_thread_log.md b/docs/en/operations/system-tables/query_thread_log.md index a6d5632ade9..0420a0392f2 100644 --- a/docs/en/operations/system-tables/query_thread_log.md +++ b/docs/en/operations/system-tables/query_thread_log.md @@ -8,7 +8,7 @@ Contains information about threads that execute queries, for example, thread nam To start logging: 1. Configure parameters in the [query_thread_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query_thread_log) section. -2. Set [log_query_threads](../../operations/settings/settings.md#settings-log-query-threads) to 1. +2. Set [log_query_threads](../../operations/settings/settings.md#log-query-threads) to 1. The flushing period of data is set in `flush_interval_milliseconds` parameter of the [query_thread_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query_thread_log) server settings section. To force flushing, use the [SYSTEM FLUSH LOGS](../../sql-reference/statements/system.md#query_language-system-flush_logs) query. @@ -18,6 +18,7 @@ You can use the [log_queries_probability](../../operations/settings/settings.md# Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the thread has finished execution of the query. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the thread has finished execution of the query. - `event_time_microsecinds` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the thread has finished execution of the query with microseconds precision. @@ -74,6 +75,7 @@ Columns: ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2020-09-11 event_time: 2020-09-11 10:08:17 event_time_microseconds: 2020-09-11 10:08:17.134042 diff --git a/docs/en/operations/system-tables/query_views_log.md b/docs/en/operations/system-tables/query_views_log.md index e107e4f926c..41a69da70aa 100644 --- a/docs/en/operations/system-tables/query_views_log.md +++ b/docs/en/operations/system-tables/query_views_log.md @@ -8,7 +8,7 @@ Contains information about the dependent views executed when running a query, fo To start logging: 1. Configure parameters in the [query_views_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query_views_log) section. -2. Set [log_query_views](../../operations/settings/settings.md#settings-log-query-views) to 1. +2. Set [log_query_views](../../operations/settings/settings.md#log-query-views) to 1. 
The flushing period of data is set in `flush_interval_milliseconds` parameter of the [query_views_log](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-query_views_log) server settings section. To force flushing, use the [SYSTEM FLUSH LOGS](../../sql-reference/statements/system.md#query_language-system-flush_logs) query. @@ -18,6 +18,7 @@ You can use the [log_queries_probability](../../operations/settings/settings.md# Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — The date when the last event of the view happened. - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the view finished execution. - `event_time_microseconds` ([DateTime](../../sql-reference/data-types/datetime.md)) — The date and time when the view finished execution with microseconds precision. @@ -59,6 +60,7 @@ Result: ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2021-06-22 event_time: 2021-06-22 13:23:07 event_time_microseconds: 2021-06-22 13:23:07.738221 diff --git a/docs/en/operations/system-tables/session_log.md b/docs/en/operations/system-tables/session_log.md index 5b1a2b2a489..5c6096b3adf 100644 --- a/docs/en/operations/system-tables/session_log.md +++ b/docs/en/operations/system-tables/session_log.md @@ -7,6 +7,7 @@ Contains information about all successful and failed login and logout events. Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `type` ([Enum8](../../sql-reference/data-types/enum.md)) — Login/logout result. Possible values: - `LoginFailure` — Login error. - `LoginSuccess` — Successful login. @@ -57,6 +58,7 @@ Result: ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal type: LoginSuccess auth_id: 45e6bd83-b4aa-4a23-85e6-bd83b4aa1a23 session_id: diff --git a/docs/en/operations/system-tables/storage_policies.md b/docs/en/operations/system-tables/storage_policies.md index 5c7184b2b22..24271a943a4 100644 --- a/docs/en/operations/system-tables/storage_policies.md +++ b/docs/en/operations/system-tables/storage_policies.md @@ -17,7 +17,7 @@ Columns: - `UNKNOWN` - `max_data_part_size` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Maximum size of a data part that can be stored on volume disks (0 — no limit). - `move_factor` ([Float64](../../sql-reference/data-types/float.md)) — Ratio of free disk space. When the ratio exceeds the value of configuration parameter, ClickHouse start to move data to the next volume in order. -- `prefer_not_to_merge` ([UInt8](../../sql-reference/data-types/int-uint.md)) — Value of the `prefer_not_to_merge` setting. When this setting is enabled, merging data on this volume is not allowed. This allows controlling how ClickHouse works with slow disks. +- `prefer_not_to_merge` ([UInt8](../../sql-reference/data-types/int-uint.md)) — Value of the `prefer_not_to_merge` setting. Should be always false. When this setting is enabled, you did a mistake. - `perform_ttl_move_on_insert` ([UInt8](../../sql-reference/data-types/int-uint.md)) — Value of the `perform_ttl_move_on_insert` setting. — Disables TTL move on data part INSERT. By default if we insert a data part that already expired by the TTL move rule it immediately goes to a volume/disk declared in move rule. 
This can significantly slowdown insert in case if destination volume/disk is slow (e.g. S3). - `load_balancing` ([Enum8](../../sql-reference/data-types/enum.md)) — Policy for disk balancing. Can have one of the following values: - `ROUND_ROBIN` diff --git a/docs/en/operations/system-tables/table_engines.md b/docs/en/operations/system-tables/table_engines.md index 08594739ecf..56668abae31 100644 --- a/docs/en/operations/system-tables/table_engines.md +++ b/docs/en/operations/system-tables/table_engines.md @@ -14,7 +14,7 @@ This table contains the following columns (the column type is shown in brackets) - `supports_sort_order` (UInt8) — Flag that indicates if table engine supports clauses `PARTITION_BY`, `PRIMARY_KEY`, `ORDER_BY` and `SAMPLE_BY`. - `supports_replication` (UInt8) — Flag that indicates if table engine supports [data replication](../../engines/table-engines/mergetree-family/replication.md). - `supports_duduplication` (UInt8) — Flag that indicates if table engine supports data deduplication. -- `supports_parallel_insert` (UInt8) — Flag that indicates if table engine supports parallel insert (see [`max_insert_threads`](../../operations/settings/settings.md#settings-max-insert-threads) setting). +- `supports_parallel_insert` (UInt8) — Flag that indicates if table engine supports parallel insert (see [`max_insert_threads`](../../operations/settings/settings.md#max-insert-threads) setting). Example: diff --git a/docs/en/operations/system-tables/tables.md b/docs/en/operations/system-tables/tables.md index e4461e14236..8049ab091c0 100644 --- a/docs/en/operations/system-tables/tables.md +++ b/docs/en/operations/system-tables/tables.md @@ -29,7 +29,7 @@ Columns: - `dependencies_database` ([Array](../../sql-reference/data-types/array.md)([String](../../sql-reference/data-types/string.md))) - Database dependencies. -- `dependencies_table` ([Array](../../sql-reference/data-types/array.md)([String](../../sql-reference/data-types/string.md))) - Table dependencies ([MaterializedView](../../engines/table-engines/special/materializedview.md) tables based on the current table). +- `dependencies_table` ([Array](../../sql-reference/data-types/array.md)([String](../../sql-reference/data-types/string.md))) - Table dependencies ([materialized views](../../sql-reference/statements/create/view.md#materialized-view) the current table). - `create_table_query` ([String](../../sql-reference/data-types/string.md)) - The query that was used to create the table. @@ -57,6 +57,8 @@ Columns: - If the table stores data on disk, returns used space on disk (i.e. compressed). - If the table stores data in memory, returns approximated number of used bytes in memory. +- `total_bytes_uncompressed` ([Nullable](../../sql-reference/data-types/nullable.md)([UInt64](../../sql-reference/data-types/int-uint.md))) - Total number of uncompressed bytes, if it's possible to quickly determine the exact number of bytes from the part checksums for the table on storage, otherwise `NULL` (does not take underlying storage (if any) into account). + - `lifetime_rows` ([Nullable](../../sql-reference/data-types/nullable.md)([UInt64](../../sql-reference/data-types/int-uint.md))) - Total number of rows INSERTed since server start (only for `Buffer` tables). - `lifetime_bytes` ([Nullable](../../sql-reference/data-types/nullable.md)([UInt64](../../sql-reference/data-types/int-uint.md))) - Total number of bytes INSERTed since server start (only for `Buffer` tables). 
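
To illustrate the new `total_bytes_uncompressed` column alongside the existing `total_bytes`, a hedged example query (the MergeTree filter is an illustrative choice; either column may be `NULL` where the value cannot be determined quickly):

```sql
-- Rough per-table compression overview.
SELECT
    database,
    name,
    formatReadableSize(total_bytes) AS compressed,
    formatReadableSize(total_bytes_uncompressed) AS uncompressed
FROM system.tables
WHERE engine LIKE '%MergeTree'
ORDER BY total_bytes DESC
LIMIT 10;
```
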
diff --git a/docs/en/operations/system-tables/text_log.md b/docs/en/operations/system-tables/text_log.md index 897cefab0be..6ac1ddbf667 100644 --- a/docs/en/operations/system-tables/text_log.md +++ b/docs/en/operations/system-tables/text_log.md @@ -7,6 +7,7 @@ Contains logging entries. The logging level which goes to this table can be limi Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` (Date) — Date of the entry. - `event_time` (DateTime) — Time of the entry. - `event_time_microseconds` (DateTime) — Time of the entry with microseconds precision. @@ -39,6 +40,7 @@ SELECT * FROM system.text_log LIMIT 1 \G ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2020-09-10 event_time: 2020-09-10 11:23:07 event_time_microseconds: 2020-09-10 11:23:07.871397 diff --git a/docs/en/operations/system-tables/trace_log.md b/docs/en/operations/system-tables/trace_log.md index 983b5b5c176..5adc33de37f 100644 --- a/docs/en/operations/system-tables/trace_log.md +++ b/docs/en/operations/system-tables/trace_log.md @@ -12,37 +12,27 @@ To analyze logs, use the `addressToLine`, `addressToLineWithInlines`, `addressTo Columns: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `event_date` ([Date](../../sql-reference/data-types/date.md)) — Date of sampling moment. - - `event_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Timestamp of the sampling moment. - - `event_time_microseconds` ([DateTime64](../../sql-reference/data-types/datetime64.md)) — Timestamp of the sampling moment with microseconds precision. - - `timestamp_ns` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Timestamp of the sampling moment in nanoseconds. - - `revision` ([UInt32](../../sql-reference/data-types/int-uint.md)) — ClickHouse server build revision. When connecting to the server by `clickhouse-client`, you see the string similar to `Connected to ClickHouse server version 19.18.1.`. This field contains the `revision`, but not the `version` of a server. - `trace_type` ([Enum8](../../sql-reference/data-types/enum.md)) — Trace type: - - `Real` represents collecting stack traces by wall-clock time. - `CPU` represents collecting stack traces by CPU time. - `Memory` represents collecting allocations and deallocations when memory allocation exceeds the subsequent watermark. - `MemorySample` represents collecting random allocations and deallocations. - `MemoryPeak` represents collecting updates of peak memory usage. - `ProfileEvent` represents collecting of increments of profile events. - - `thread_id` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Thread identifier. - - `query_id` ([String](../../sql-reference/data-types/string.md)) — Query identifier that can be used to get details about a query that was running from the [query_log](#system_tables-query_log) system table. - - `trace` ([Array(UInt64)](../../sql-reference/data-types/array.md)) — Stack trace at the moment of sampling. Each element is a virtual memory address inside ClickHouse server process. - - `size` ([Int64](../../sql-reference/data-types/int-uint.md)) - For trace types `Memory`, `MemorySample` or `MemoryPeak` is the amount of memory allocated, for other trace types is 0. 
- - `event` ([LowCardinality(String)](../../sql-reference/data-types/lowcardinality.md)) - For trace type `ProfileEvent` is the name of updated profile event, for other trace types is an empty string. - - `increment` ([UInt64](../../sql-reference/data-types/int-uint.md)) - For trace type `ProfileEvent` is the amount of increment of profile event, for other trace types is 0. **Example** @@ -54,6 +44,7 @@ SELECT * FROM system.trace_log LIMIT 1 \G ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal event_date: 2020-09-10 event_time: 2020-09-10 11:23:09 event_time_microseconds: 2020-09-10 11:23:09.872924 diff --git a/docs/en/operations/system-tables/view_refreshes.md b/docs/en/operations/system-tables/view_refreshes.md new file mode 100644 index 00000000000..12377507b39 --- /dev/null +++ b/docs/en/operations/system-tables/view_refreshes.md @@ -0,0 +1,43 @@ +--- +slug: /en/operations/system-tables/view_refreshes +--- +# view_refreshes + +Information about [Refreshable Materialized Views](../../sql-reference/statements/create/view.md#refreshable-materialized-view). Contains all refreshable materialized views, regardless of whether there's a refresh in progress or not. + + +Columns: + +- `database` ([String](../../sql-reference/data-types/string.md)) — The name of the database the table is in. +- `view` ([String](../../sql-reference/data-types/string.md)) — Table name. +- `status` ([String](../../sql-reference/data-types/string.md)) — Current state of the refresh. +- `last_refresh_result` ([String](../../sql-reference/data-types/string.md)) — Outcome of the latest refresh attempt. +- `last_refresh_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Time of the last refresh attempt. `NULL` if no refresh attempts happened since server startup or table creation. +- `last_success_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Time of the last successful refresh. `NULL` if no successful refreshes happened since server startup or table creation. +- `duration_ms` ([UInt64](../../sql-reference/data-types/int-uint.md)) — How long the last refresh attempt took. +- `next_refresh_time` ([DateTime](../../sql-reference/data-types/datetime.md)) — Time at which the next refresh is scheduled to start. +- `remaining_dependencies` ([Array(String)](../../sql-reference/data-types/array.md)) — If the view has [refresh dependencies](../../sql-reference/statements/create/view.md#refresh-dependencies), this array contains the subset of those dependencies that are not satisfied for the current refresh yet. If `status = 'WaitingForDependencies'`, a refresh is ready to start as soon as these dependencies are fulfilled. +- `exception` ([String](../../sql-reference/data-types/string.md)) — if `last_refresh_result = 'Exception'`, i.e. the last refresh attempt failed, this column contains the corresponding error message and stack trace. +- `refresh_count` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Number of successful refreshes since last server restart or table creation. +- `progress` ([Float64](../../sql-reference/data-types/float.md)) — Progress of the current refresh, between 0 and 1. +- `read_rows` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Number of rows read by the current refresh so far. +- `total_rows` ([UInt64](../../sql-reference/data-types/int-uint.md)) — Estimated total number of rows that need to be read by the current refresh. + +(There are additional columns related to current refresh progress, but they are currently unreliable.) 
+ +**Example** + +```sql +SELECT + database, + view, + status, + last_refresh_result, + last_refresh_time, + next_refresh_time +FROM system.view_refreshes + +┌─database─┬─view───────────────────────┬─status────┬─last_refresh_result─┬───last_refresh_time─┬───next_refresh_time─┐ +│ default │ hello_documentation_reader │ Scheduled │ Finished │ 2023-12-01 01:24:00 │ 2023-12-01 01:25:00 │ +└──────────┴────────────────────────────┴───────────┴─────────────────────┴─────────────────────┴─────────────────────┘ +``` diff --git a/docs/en/operations/system-tables/zookeeper_log.md b/docs/en/operations/system-tables/zookeeper_log.md index dce5be29f62..dd2df2ba5fc 100644 --- a/docs/en/operations/system-tables/zookeeper_log.md +++ b/docs/en/operations/system-tables/zookeeper_log.md @@ -9,6 +9,7 @@ For requests, only columns with request parameters are filled in, and the remain Columns with request parameters: +- `hostname` ([LowCardinality(String)](../../sql-reference/data-types/string.md)) — Hostname of the server executing the query. - `type` ([Enum](../../sql-reference/data-types/enum.md)) — Event type in the ZooKeeper client. Can have one of the following values: - `Request` — The request has been sent. - `Response` — The response was received. @@ -63,6 +64,7 @@ Result: ``` text Row 1: ────── +hostname: clickhouse.eu-central1.internal type: Request event_date: 2021-08-09 event_time: 2021-08-09 21:38:30.291792 diff --git a/docs/en/operations/tips.md b/docs/en/operations/tips.md index 8f6cf6ad147..757afff599c 100644 --- a/docs/en/operations/tips.md +++ b/docs/en/operations/tips.md @@ -93,7 +93,7 @@ While ClickHouse can work over NFS, it is not the best idea. ## Linux Kernel {#linux-kernel} -Don’t use an outdated Linux kernel. +Don't use an outdated Linux kernel. ## Network {#network} diff --git a/docs/en/operations/utilities/clickhouse-benchmark.md b/docs/en/operations/utilities/clickhouse-benchmark.md index 8620b44c368..8b7d7f85552 100644 --- a/docs/en/operations/utilities/clickhouse-benchmark.md +++ b/docs/en/operations/utilities/clickhouse-benchmark.md @@ -53,7 +53,6 @@ clickhouse-benchmark [keys] < queries_file; - `--confidence=N` — Level of confidence for T-test. Possible values: 0 (80%), 1 (90%), 2 (95%), 3 (98%), 4 (99%), 5 (99.5%). Default value: 5. In the [comparison mode](#clickhouse-benchmark-comparison-mode) `clickhouse-benchmark` performs the [Independent two-sample Student’s t-test](https://en.wikipedia.org/wiki/Student%27s_t-test#Independent_two-sample_t-test) to determine whether the two distributions aren’t different with the selected level of confidence. - `--cumulative` — Printing cumulative data instead of data per interval. - `--database=DATABASE_NAME` — ClickHouse database name. Default value: `default`. -- `--json=FILEPATH` — `JSON` output. When the key is set, `clickhouse-benchmark` outputs a report to the specified JSON-file. - `--user=USERNAME` — ClickHouse user name. Default value: `default`. - `--password=PSWD` — ClickHouse user password. Default value: empty string. - `--stacktrace` — Stack traces output. When the key is set, `clickhouse-bencmark` outputs stack traces of exceptions. 
diff --git a/docs/en/sql-reference/aggregate-functions/parametric-functions.md b/docs/en/sql-reference/aggregate-functions/parametric-functions.md index 5fbbf8f723c..3654cd157e9 100644 --- a/docs/en/sql-reference/aggregate-functions/parametric-functions.md +++ b/docs/en/sql-reference/aggregate-functions/parametric-functions.md @@ -487,24 +487,23 @@ Where: ## uniqUpTo(N)(x) -Calculates the number of different argument values if it is less than or equal to N. If the number of different argument values is greater than N, it returns N + 1. +Calculates the number of different values of the argument up to a specified limit, `N`. If the number of different argument values is greater than `N`, this function returns `N` + 1, otherwise it calculates the exact value. -Recommended for use with small Ns, up to 10. The maximum value of N is 100. +Recommended for use with small `N`s, up to 10. The maximum value of `N` is 100. -For the state of an aggregate function, it uses the amount of memory equal to 1 + N \* the size of one value of bytes. -For strings, it stores a non-cryptographic hash of 8 bytes. That is, the calculation is approximated for strings. +For the state of an aggregate function, this function uses the amount of memory equal to 1 + `N` \* the size of one value, in bytes. +When dealing with strings, this function stores a non-cryptographic hash of 8 bytes; the calculation is approximated for strings. -The function also works for several arguments. +For example, suppose you have a table that logs every search query made by users on your website. Each row in the table represents a single search query, with columns for the user ID, the search query, and the timestamp of the query. You can use `uniqUpTo` to generate a report that shows only the keywords that produced at least 5 unique users: -It works as fast as possible, except for cases when a large N value is used and the number of unique values is slightly less than N. - -Usage example: - -``` text -Problem: Generate a report that shows only keywords that produced at least 5 unique users. -Solution: Write in the GROUP BY query SearchPhrase HAVING uniqUpTo(4)(UserID) >= 5 +```sql +SELECT SearchPhrase +FROM SearchLog +GROUP BY SearchPhrase +HAVING uniqUpTo(4)(UserID) >= 5 ``` +`uniqUpTo(4)(UserID)` calculates the number of unique `UserID` values for each `SearchPhrase`, but it only counts up to 4 unique values. If there are more than 4 unique `UserID` values for a `SearchPhrase`, the function returns 5 (4 + 1). The `HAVING` clause then filters out the `SearchPhrase` values for which the number of unique `UserID` values is less than 5. This will give you a list of search keywords that were used by at least 5 unique users. ## sumMapFiltered(keys_to_keep)(keys, values) diff --git a/docs/en/sql-reference/aggregate-functions/reference/count.md b/docs/en/sql-reference/aggregate-functions/reference/count.md index a40108a331a..ca4067c8d8c 100644 --- a/docs/en/sql-reference/aggregate-functions/reference/count.md +++ b/docs/en/sql-reference/aggregate-functions/reference/count.md @@ -28,7 +28,7 @@ In both cases the type of the returned value is [UInt64](../../../sql-reference/ **Details** -ClickHouse supports the `COUNT(DISTINCT ...)` syntax. The behavior of this construction depends on the [count_distinct_implementation](../../../operations/settings/settings.md#settings-count_distinct_implementation) setting.
It defines which of the [uniq\*](../../../sql-reference/aggregate-functions/reference/uniq.md#agg_function-uniq) functions is used to perform the operation. The default is the [uniqExact](../../../sql-reference/aggregate-functions/reference/uniqexact.md#agg_function-uniqexact) function. +ClickHouse supports the `COUNT(DISTINCT ...)` syntax. The behavior of this construction depends on the [count_distinct_implementation](../../../operations/settings/settings.md#count_distinct_implementation) setting. It defines which of the [uniq\*](../../../sql-reference/aggregate-functions/reference/uniq.md#agg_function-uniq) functions is used to perform the operation. The default is the [uniqExact](../../../sql-reference/aggregate-functions/reference/uniqexact.md#agg_function-uniqexact) function. The `SELECT count() FROM table` query is optimized by default using metadata from MergeTree. If you need to use row-level security, disable optimization using the [optimize_trivial_count_query](../../../operations/settings/settings.md#optimize-trivial-count-query) setting. diff --git a/docs/en/sql-reference/aggregate-functions/reference/grouparraysorted.md b/docs/en/sql-reference/aggregate-functions/reference/grouparraysorted.md deleted file mode 100644 index cc601c097fe..00000000000 --- a/docs/en/sql-reference/aggregate-functions/reference/grouparraysorted.md +++ /dev/null @@ -1,48 +0,0 @@ - --- - toc_priority: 112 - --- - - # groupArraySorted {#groupArraySorted} - - Returns an array with the first N items in ascending order. - - ``` sql - groupArraySorted(N)(column) - ``` - - **Arguments** - - - `N` – The number of elements to return. - - If the parameter is omitted, default value is the size of input. - - - `column` – The value (Integer, String, Float and other Generic types). 
- - **Example** - - Gets the first 10 numbers: - - ``` sql - SELECT groupArraySorted(10)(number) FROM numbers(100) - ``` - - ``` text - ┌─groupArraySorted(10)(number)─┐ - │ [0,1,2,3,4,5,6,7,8,9] │ - └──────────────────────────────┘ - ``` - - - Gets all the String implementations of all numbers in column: - - ``` sql -SELECT groupArraySorted(str) FROM (SELECT toString(number) as str FROM numbers(5)); - - ``` - - ``` text - ┌─groupArraySorted(str)────────┐ - │ ['0','1','2','3','4'] │ - └──────────────────────────────┘ - ``` - \ No newline at end of file diff --git a/docs/en/sql-reference/aggregate-functions/reference/index.md b/docs/en/sql-reference/aggregate-functions/reference/index.md index 3bf0e070cae..b1f2c5bacbb 100644 --- a/docs/en/sql-reference/aggregate-functions/reference/index.md +++ b/docs/en/sql-reference/aggregate-functions/reference/index.md @@ -54,7 +54,6 @@ ClickHouse-specific aggregate functions: - [groupArrayMovingAvg](/docs/en/sql-reference/aggregate-functions/reference/grouparraymovingavg.md) - [groupArrayMovingSum](/docs/en/sql-reference/aggregate-functions/reference/grouparraymovingsum.md) - [groupArraySample](./grouparraysample.md) -- [groupArraySorted](/docs/en/sql-reference/aggregate-functions/reference/grouparraysorted.md) - [groupBitAnd](/docs/en/sql-reference/aggregate-functions/reference/groupbitand.md) - [groupBitOr](/docs/en/sql-reference/aggregate-functions/reference/groupbitor.md) - [groupBitXor](/docs/en/sql-reference/aggregate-functions/reference/groupbitxor.md) diff --git a/docs/en/sql-reference/aggregate-functions/reference/sparkbar.md b/docs/en/sql-reference/aggregate-functions/reference/sparkbar.md index e21dad5b2f5..62edc221858 100644 --- a/docs/en/sql-reference/aggregate-functions/reference/sparkbar.md +++ b/docs/en/sql-reference/aggregate-functions/reference/sparkbar.md @@ -1,62 +1,64 @@ ---- -slug: /en/sql-reference/aggregate-functions/reference/sparkbar -sidebar_position: 311 -sidebar_label: sparkbar ---- - -# sparkbar - -The function plots a frequency histogram for values `x` and the repetition rate `y` of these values over the interval `[min_x, max_x]`. -Repetitions for all `x` falling into the same bucket are averaged, so data should be pre-aggregated. -Negative repetitions are ignored. - -If no interval is specified, then the minimum `x` is used as the interval start, and the maximum `x` — as the interval end. -Otherwise, values outside the interval are ignored. - -**Syntax** - -``` sql -sparkbar(buckets[, min_x, max_x])(x, y) -``` - -**Parameters** - -- `buckets` — The number of segments. Type: [Integer](../../../sql-reference/data-types/int-uint.md). -- `min_x` — The interval start. Optional parameter. -- `max_x` — The interval end. Optional parameter. - -**Arguments** - -- `x` — The field with values. -- `y` — The field with the frequency of values. - -**Returned value** - -- The frequency histogram. 
- -**Example** - -Query: - -``` sql -CREATE TABLE spark_bar_data (`value` Int64, `event_date` Date) ENGINE = MergeTree ORDER BY event_date; - -INSERT INTO spark_bar_data VALUES (1,'2020-01-01'), (3,'2020-01-02'), (4,'2020-01-02'), (-3,'2020-01-02'), (5,'2020-01-03'), (2,'2020-01-04'), (3,'2020-01-05'), (7,'2020-01-06'), (6,'2020-01-07'), (8,'2020-01-08'), (2,'2020-01-11'); - -SELECT sparkbar(9)(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); - -SELECT sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); -``` - -Result: - -``` text -┌─sparkbar(9)(event_date, cnt)─┐ -│ ▂▅▂▃▆█ ▂ │ -└──────────────────────────────┘ - -┌─sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date, cnt)─┐ -│ ▂▅▂▃▇▆█ │ -└──────────────────────────────────────────────────────────────────────────┘ -``` - +--- +slug: /en/sql-reference/aggregate-functions/reference/sparkbar +sidebar_position: 311 +sidebar_label: sparkbar +--- + +# sparkbar + +The function plots a frequency histogram for values `x` and the repetition rate `y` of these values over the interval `[min_x, max_x]`. +Repetitions for all `x` falling into the same bucket are averaged, so data should be pre-aggregated. +Negative repetitions are ignored. + +If no interval is specified, then the minimum `x` is used as the interval start, and the maximum `x` — as the interval end. +Otherwise, values outside the interval are ignored. + +**Syntax** + +``` sql +sparkbar(buckets[, min_x, max_x])(x, y) +``` + +**Parameters** + +- `buckets` — The number of segments. Type: [Integer](../../../sql-reference/data-types/int-uint.md). +- `min_x` — The interval start. Optional parameter. +- `max_x` — The interval end. Optional parameter. + +**Arguments** + +- `x` — The field with values. +- `y` — The field with the frequency of values. + +**Returned value** + +- The frequency histogram. + +**Example** + +Query: + +``` sql +CREATE TABLE spark_bar_data (`value` Int64, `event_date` Date) ENGINE = MergeTree ORDER BY event_date; + +INSERT INTO spark_bar_data VALUES (1,'2020-01-01'), (3,'2020-01-02'), (4,'2020-01-02'), (-3,'2020-01-02'), (5,'2020-01-03'), (2,'2020-01-04'), (3,'2020-01-05'), (7,'2020-01-06'), (6,'2020-01-07'), (8,'2020-01-08'), (2,'2020-01-11'); + +SELECT sparkbar(9)(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); + +SELECT sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); +``` + +Result: + +``` text +┌─sparkbar(9)(event_date, cnt)─┐ +│ ▂▅▂▃▆█ ▂ │ +└──────────────────────────────┘ + +┌─sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date, cnt)─┐ +│ ▂▅▂▃▇▆█ │ +└──────────────────────────────────────────────────────────────────────────┘ +``` + +The alias for this function is sparkBar. 
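+
+For example, the alias should be usable in place of `sparkbar`, reusing the `spark_bar_data` table from the example above:
+
+``` sql
+SELECT sparkBar(9)(event_date, cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date);
+```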
+ diff --git a/docs/en/sql-reference/dictionaries/index.md b/docs/en/sql-reference/dictionaries/index.md index 4f021b25809..9f86aaf2502 100644 --- a/docs/en/sql-reference/dictionaries/index.md +++ b/docs/en/sql-reference/dictionaries/index.md @@ -394,7 +394,7 @@ Configuration example: or ``` sql -LAYOUT(HASHED_ARRAY()) +LAYOUT(HASHED_ARRAY([SHARDS 1])) ``` ### complex_key_hashed_array @@ -412,7 +412,7 @@ Configuration example: or ``` sql -LAYOUT(COMPLEX_KEY_HASHED_ARRAY()) +LAYOUT(COMPLEX_KEY_HASHED_ARRAY([SHARDS 1])) ``` ### range_hashed {#range_hashed} @@ -2415,8 +2415,8 @@ clickhouse client \ --secure \ --password MY_PASSWORD \ --query " - INSERT INTO regexp_dictionary_source_table - SELECT * FROM input ('id UInt64, parent_id UInt64, regexp String, keys Array(String), values Array(String)') + INSERT INTO regexp_dictionary_source_table + SELECT * FROM input ('id UInt64, parent_id UInt64, regexp String, keys Array(String), values Array(String)') FORMAT CSV" < regexp_dict.csv ``` diff --git a/docs/en/sql-reference/functions/array-functions.md b/docs/en/sql-reference/functions/array-functions.md index 00efa63c960..f5da00a8663 100644 --- a/docs/en/sql-reference/functions/array-functions.md +++ b/docs/en/sql-reference/functions/array-functions.md @@ -143,7 +143,7 @@ range([start, ] end [, step]) **Implementation details** - All arguments `start`, `end`, `step` must be below data types: `UInt8`, `UInt16`, `UInt32`, `UInt64`,`Int8`, `Int16`, `Int32`, `Int64`, as well as elements of the returned array, which's type is a super type of all arguments. -- An exception is thrown if query results in arrays with a total length of more than number of elements specified by the [function_range_max_elements_in_block](../../operations/settings/settings.md#settings-function_range_max_elements_in_block) setting. +- An exception is thrown if query results in arrays with a total length of more than number of elements specified by the [function_range_max_elements_in_block](../../operations/settings/settings.md#function_range_max_elements_in_block) setting. - Returns Null if any argument has Nullable(Nothing) type. An exception is thrown if any argument has Null value (Nullable(T) type). **Examples** diff --git a/docs/en/sql-reference/functions/date-time-functions.md b/docs/en/sql-reference/functions/date-time-functions.md index 565486275e6..0261589b968 100644 --- a/docs/en/sql-reference/functions/date-time-functions.md +++ b/docs/en/sql-reference/functions/date-time-functions.md @@ -1809,6 +1809,8 @@ Alias: `dateTrunc`. - `quarter` - `year` + `unit` argument is case-insensitive. + - `value` — Date and time. [DateTime](../../sql-reference/data-types/datetime.md) or [DateTime64](../../sql-reference/data-types/datetime64.md). - `timezone` — [Timezone name](../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-timezone) for the returned value (optional). If not specified, the function uses the timezone of the `value` parameter. [String](../../sql-reference/data-types/string.md). diff --git a/docs/en/sql-reference/functions/hash-functions.md b/docs/en/sql-reference/functions/hash-functions.md index 4816a6f0032..a23849c13aa 100644 --- a/docs/en/sql-reference/functions/hash-functions.md +++ b/docs/en/sql-reference/functions/hash-functions.md @@ -319,9 +319,9 @@ This is a relatively fast non-cryptographic hash function of average quality for Calculates a 64-bit hash code from any type of integer. It works faster than intHash32. Average quality. 
-## SHA1, SHA224, SHA256, SHA512 +## SHA1, SHA224, SHA256, SHA512, SHA512_256 -Calculates SHA-1, SHA-224, SHA-256, SHA-512 hash from a string and returns the resulting set of bytes as [FixedString](/docs/en/sql-reference/data-types/fixedstring.md). +Calculates SHA-1, SHA-224, SHA-256, SHA-512, SHA-512-256 hash from a string and returns the resulting set of bytes as [FixedString](/docs/en/sql-reference/data-types/fixedstring.md). **Syntax** @@ -1780,12 +1780,11 @@ Result: ## sqid Transforms numbers into YouTube-like short URL hash called [Sqid](https://sqids.org/). -To use this function, set setting `allow_experimental_hash_functions = 1`. **Syntax** ```sql -sqid(number1,...) +sqid(number1, ...) ``` **Arguments** diff --git a/docs/en/sql-reference/functions/introspection.md b/docs/en/sql-reference/functions/introspection.md index 8cb35483555..1025b8bdc3d 100644 --- a/docs/en/sql-reference/functions/introspection.md +++ b/docs/en/sql-reference/functions/introspection.md @@ -16,7 +16,7 @@ For proper operation of introspection functions: - Install the `clickhouse-common-static-dbg` package. -- Set the [allow_introspection_functions](../../operations/settings/settings.md#settings-allow_introspection_functions) setting to 1. +- Set the [allow_introspection_functions](../../operations/settings/settings.md#allow_introspection_functions) setting to 1. For security reasons introspection functions are disabled by default. diff --git a/docs/en/sql-reference/functions/ip-address-functions.md b/docs/en/sql-reference/functions/ip-address-functions.md index 33c788a632e..be20e02d77e 100644 --- a/docs/en/sql-reference/functions/ip-address-functions.md +++ b/docs/en/sql-reference/functions/ip-address-functions.md @@ -501,41 +501,3 @@ Result: │ 0 │ └────────────────────────────────────────────────────────────────────┘ ``` - -## reverseDNSQuery - -Performs a reverse DNS query to get the PTR records associated with the IP address. - -**Syntax** - -``` sql -reverseDNSQuery(address) -``` - -This function performs reverse DNS resolutions on both IPv4 and IPv6. - -**Arguments** - -- `address` — An IPv4 or IPv6 address. [String](../../sql-reference/data-types/string.md). - -**Returned value** - -- Associated domains (PTR records). - -Type: Type: [Array(String)](../../sql-reference/data-types/array.md). - -**Example** - -Query: - -``` sql -SELECT reverseDNSQuery('192.168.0.2'); -``` - -Result: - -``` text -┌─reverseDNSQuery('192.168.0.2')────────────┐ -│ ['test2.example.com','test3.example.com'] │ -└───────────────────────────────────────────┘ -``` diff --git a/docs/en/sql-reference/functions/other-functions.md b/docs/en/sql-reference/functions/other-functions.md index b2a1d5066bb..35f9c7af2ce 100644 --- a/docs/en/sql-reference/functions/other-functions.md +++ b/docs/en/sql-reference/functions/other-functions.md @@ -67,45 +67,7 @@ WHERE macro = 'test'; │ test │ Value │ └───────┴──────────────┘ ``` - -## getClientHTTPHeader -Returns the value of specified http header.If there is no such header or the request method is not http, it will throw an exception. -**Syntax** - -```sql -getClientHTTPHeader(name); -``` - -**Arguments** - -- `name` — HTTP header name .[String](../../sql-reference/data-types/string.md#string) - -**Returned value** - -Value of the specified header. -Type:[String](../../sql-reference/data-types/string.md#string). - - -When we use `clickhouse-client` to execute this function, we'll always get empty string, because client doesn't use http protocol. 
-```sql -SELECT getCientHTTPHeader('test') -``` -result: - -```text -┌─getClientHTTPHeader('test')─┐ -│ │ -└────────────------───────────┘ -``` -Try to use http request: -```shell -echo "select getClientHTTPHeader('X-Clickhouse-User')" | curl -H 'X-ClickHouse-User: default' -H 'X-ClickHouse-Key: ' 'http://localhost:8123/' -d @- - -#result -default -``` - ## FQDN Returns the fully qualified domain name of the ClickHouse server. @@ -666,6 +628,8 @@ SELECT formatReadableSize(filesize_bytes) AS filesize ``` +Alias: `FORMAT_BYTES`. + ``` text ┌─filesize_bytes─┬─filesize───┐ │ 1 │ 1.00 B │ @@ -2867,3 +2831,92 @@ Result: │ SELECT a, b FROM tab WHERE (a > 3) AND (b < 3) │ └─────────────────────────────────────────────────────────────────────────┘ ``` + +## minSampleSizeConversion + +Calculates minimum required sample size for an A/B test comparing conversions (proportions) in two samples. + +**Syntax** + +``` sql +minSampleSizeConversion(baseline, mde, power, alpha) +``` + +Uses the formula described in [this article](https://towardsdatascience.com/required-sample-size-for-a-b-testing-6f6608dd330a). Assumes equal sizes of treatment and control groups. Returns the sample size required for one group (i.e. the sample size required for the whole experiment is twice the returned value). + +**Arguments** + +- `baseline` — Baseline conversion. [Float](../data-types/float.md). +- `mde` — Minimum detectable effect (MDE) as percentage points (e.g. for a baseline conversion 0.25 the MDE 0.03 means an expected change to 0.25 ± 0.03). [Float](../data-types/float.md). +- `power` — Required statistical power of a test (1 - probability of Type II error). [Float](../data-types/float.md). +- `alpha` — Required significance level of a test (probability of Type I error). [Float](../data-types/float.md). + +**Returned value** + +A named [Tuple](../data-types/tuple.md) with 3 elements: + +- `"minimum_sample_size"` — Required sample size. [Float64](../data-types/float.md). +- `"detect_range_lower"` — Lower bound of the range of values not detectable with the returned required sample size (i.e. all values less than or equal to `"detect_range_lower"` are detectable with the provided `alpha` and `power`). Calculated as `baseline - mde`. [Float64](../data-types/float.md). +- `"detect_range_upper"` — Upper bound of the range of values not detectable with the returned required sample size (i.e. all values greater than or equal to `"detect_range_upper"` are detectable with the provided `alpha` and `power`). Calculated as `baseline + mde`. [Float64](../data-types/float.md). + +**Example** + +The following query calculates the required sample size for an A/B test with baseline conversion of 25%, MDE of 3%, significance level of 5%, and the desired statistical power of 80%: + +``` sql +SELECT minSampleSizeConversion(0.25, 0.03, 0.80, 0.05) AS sample_size; +``` + +Result: + +``` text +┌─sample_size───────────────────┐ +│ (3396.077603219163,0.22,0.28) │ +└───────────────────────────────┘ +``` + +## minSampleSizeContinuous + +Calculates minimum required sample size for an A/B test comparing means of a continuous metric in two samples. + +**Syntax** + +``` sql +minSampleSizeContinous(baseline, sigma, mde, power, alpha) +``` + +Alias: `minSampleSizeContinous` + +Uses the formula described in [this article](https://towardsdatascience.com/required-sample-size-for-a-b-testing-6f6608dd330a). Assumes equal sizes of treatment and control groups. Returns the required sample size for one group (i.e. 
the sample size required for the whole experiment is twice the returned value). Also assumes equal variance of the test metric in treatment and control groups. + +**Arguments** + +- `baseline` — Baseline value of a metric. [Integer](../data-types/int-uint.md) or [Float](../data-types/float.md). +- `sigma` — Baseline standard deviation of a metric. [Integer](../data-types/int-uint.md) or [Float](../data-types/float.md). +- `mde` — Minimum detectable effect (MDE) as percentage of the baseline value (e.g. for a baseline value 112.25 the MDE 0.03 means an expected change to 112.25 ± 112.25*0.03). [Integer](../data-types/int-uint.md) or [Float](../data-types/float.md). +- `power` — Required statistical power of a test (1 - probability of Type II error). [Integer](../data-types/int-uint.md) or [Float](../data-types/float.md). +- `alpha` — Required significance level of a test (probability of Type I error). [Integer](../data-types/int-uint.md) or [Float](../data-types/float.md). + +**Returned value** + +A named [Tuple](../data-types/tuple.md) with 3 elements: + +- `"minimum_sample_size"` — Required sample size. [Float64](../data-types/float.md). +- `"detect_range_lower"` — Lower bound of the range of values not detectable with the returned required sample size (i.e. all values less than or equal to `"detect_range_lower"` are detectable with the provided `alpha` and `power`). Calculated as `baseline * (1 - mde)`. [Float64](../data-types/float.md). +- `"detect_range_upper"` — Upper bound of the range of values not detectable with the returned required sample size (i.e. all values greater than or equal to `"detect_range_upper"` are detectable with the provided `alpha` and `power`). Calculated as `baseline * (1 + mde)`. [Float64](../data-types/float.md). + +**Example** + +The following query calculates the required sample size for an A/B test on a metric with baseline value of 112.25, standard deviation of 21.1, MDE of 3%, significance level of 5%, and the desired statistical power of 80%: + +``` sql +SELECT minSampleSizeContinous(112.25, 21.1, 0.03, 0.80, 0.05) AS sample_size; +``` + +Result: + +``` text +┌─sample_size───────────────────────────┐ +│ (616.2931945826209,108.8825,115.6175) │ +└───────────────────────────────────────┘ +``` diff --git a/docs/en/sql-reference/functions/string-functions.md b/docs/en/sql-reference/functions/string-functions.md index 1940993ce0b..20694211912 100644 --- a/docs/en/sql-reference/functions/string-functions.md +++ b/docs/en/sql-reference/functions/string-functions.md @@ -393,40 +393,6 @@ Reverses the sequence of bytes in a string. Reverses a sequence of Unicode code points in a string. Assumes that the string contains valid UTF-8 encoded text. If this assumption is violated, no exception is thrown and the result is undefined. -## format - -Format the `pattern` string with the strings listed in the arguments, similar to formatting in Python. The pattern string can contain replacement fields surrounded by curly braces `{}`. Anything not contained in braces is considered literal text and copied verbatim into the output. Literal brace character can be escaped by two braces: `{{ '{{' }}` and `{{ '}}' }}`. Field names can be numbers (starting from zero) or empty (then they are implicitly given monotonically increasing numbers). 
- -**Syntax** - -```sql -format(pattern, s0, s1, …) -``` - -**Example** - -``` sql -SELECT format('{1} {0} {1}', 'World', 'Hello') -``` - -```result -┌─format('{1} {0} {1}', 'World', 'Hello')─┐ -│ Hello World Hello │ -└─────────────────────────────────────────┘ -``` - -With implicit numbers: - -``` sql -SELECT format('{} {}', 'Hello', 'World') -``` - -```result -┌─format('{} {}', 'Hello', 'World')─┐ -│ Hello World │ -└───────────────────────────────────┘ -``` - ## concat Concatenates the given arguments. @@ -567,8 +533,8 @@ Result: ```result ┌─concatWithSeparator('a', '1', '2', '3', '4')─┐ -│ 1a2a3a4 │ -└───────────────────────────────────┘ +│ 1a2a3a4 │ +└──────────────────────────────────────────────┘ ``` ## concatWithSeparatorAssumeInjective @@ -577,26 +543,52 @@ Like `concatWithSeparator` but assumes that `concatWithSeparator(sep, expr1, exp A function is called injective if it returns for different arguments different results. In other words: different arguments never produce identical result. -## substring(s, offset, length) +## substring -Returns a substring with `length` many bytes, starting at the byte at index `offset`. Character indexing starts from 1. +Returns the substring of a string `s` which starts at the specified byte index `offset`. Byte counting starts from 1. If `offset` is 0, an empty string is returned. If `offset` is negative, the substring starts `pos` characters from the end of the string, rather than from the beginning. An optional argument `length` specifies the maximum number of bytes the returned substring may have. **Syntax** ```sql -substring(s, offset, length) +substring(s, offset[, length]) ``` Alias: - `substr` - `mid` +**Arguments** + +- `s` — The string to calculate a substring from. [String](../../sql-reference/data-types/string.md), [FixedString](../../sql-reference/data-types/fixedstring.md) or [Enum](../../sql-reference/data-types/enum.md) +- `offset` — The starting position of the substring in `s` . [(U)Int*](../../sql-reference/data-types/int-uint.md). +- `length` — The maximum length of the substring. [(U)Int*](../../sql-reference/data-types/int-uint.md). Optional. + +**Returned value** + +A substring of `s` with `length` many bytes, starting at index `offset`. + +Type: `String`. + +**Example** + +``` sql +SELECT 'database' AS db, substr(db, 5), substr(db, 5, 1) +``` + +Result: + +```result +┌─db───────┬─substring('database', 5)─┬─substring('database', 5, 1)─┐ +│ database │ base │ b │ +└──────────┴──────────────────────────┴─────────────────────────────┘ +``` + ## substringUTF8 Like `substring` but for Unicode code points. Assumes that the string contains valid UTF-8 encoded text. If this assumption is violated, no exception is thrown and the result is undefined. -## substringIndex(s, delim, count) +## substringIndex Returns the substring of `s` before `count` occurrences of the delimiter `delim`, as in Spark or MySQL. @@ -627,7 +619,7 @@ Result: └──────────────────────────────────────────────┘ ``` -## substringIndexUTF8(s, delim, count) +## substringIndexUTF8 Like `substringIndex` but for Unicode code points. Assumes that the string contains valid UTF-8 encoded text. If this assumption is violated, no exception is thrown and the result is undefined. @@ -1259,7 +1251,7 @@ This function also replaces numeric character references with Unicode characters **Syntax** ``` sql -decodeHTMComponent(x) +decodeHTMLComponent(x) ``` **Arguments** @@ -1276,7 +1268,7 @@ Type: [String](../../sql-reference/data-types/string.md). 
``` sql SELECT decodeHTMLComponent(''CH'); -SELECT decodeHMLComponent('I♥ClickHouse'); +SELECT decodeHTMLComponent('I♥ClickHouse'); ``` Result: diff --git a/docs/en/sql-reference/functions/string-replace-functions.md b/docs/en/sql-reference/functions/string-replace-functions.md index 74d5d747193..c7bd16cad4a 100644 --- a/docs/en/sql-reference/functions/string-replace-functions.md +++ b/docs/en/sql-reference/functions/string-replace-functions.md @@ -132,6 +132,40 @@ For more information, see [RE2](https://github.com/google/re2/blob/master/re2/re regexpQuoteMeta(s) ``` +## format + +Format the `pattern` string with the values (strings, integers, etc.) listed in the arguments, similar to formatting in Python. The pattern string can contain replacement fields surrounded by curly braces `{}`. Anything not contained in braces is considered literal text and copied verbatim into the output. Literal brace character can be escaped by two braces: `{{ '{{' }}` and `{{ '}}' }}`. Field names can be numbers (starting from zero) or empty (then they are implicitly given monotonically increasing numbers). + +**Syntax** + +```sql +format(pattern, s0, s1, …) +``` + +**Example** + +``` sql +SELECT format('{1} {0} {1}', 'World', 'Hello') +``` + +```result +┌─format('{1} {0} {1}', 'World', 'Hello')─┐ +│ Hello World Hello │ +└─────────────────────────────────────────┘ +``` + +With implicit numbers: + +``` sql +SELECT format('{} {}', 'Hello', 'World') +``` + +```result +┌─format('{} {}', 'Hello', 'World')─┐ +│ Hello World │ +└───────────────────────────────────┘ +``` + ## translate Replaces characters in the string `s` using a one-to-one character mapping defined by `from` and `to` strings. `from` and `to` must be constant ASCII strings of the same size. Non-ASCII characters in the original string are not modified. diff --git a/docs/en/sql-reference/functions/time-series-functions.md b/docs/en/sql-reference/functions/time-series-functions.md index e183fdcdcd7..434432baa48 100644 --- a/docs/en/sql-reference/functions/time-series-functions.md +++ b/docs/en/sql-reference/functions/time-series-functions.md @@ -11,8 +11,7 @@ Below functions are used for time series analysis. ## seriesPeriodDetectFFT Finds the period of the given time series data using FFT -Detect Period in time series data using FFT. -FFT - Fast Fourier transform (https://en.wikipedia.org/wiki/Fast_Fourier_transform) +FFT - [Fast Fourier transform](https://en.wikipedia.org/wiki/Fast_Fourier_transform) **Syntax** @@ -27,6 +26,7 @@ seriesPeriodDetectFFT(series); **Returned value** - A real value equal to the period of time series +- Returns NAN when number of data points are less than four. Type: [Float64](../../sql-reference/data-types/float.md). 
@@ -45,3 +45,15 @@ Result: │ 3 │ └────────────────────────┘ ``` + +``` sql +SELECT seriesPeriodDetectFFT(arrayMap(x -> abs((x % 6) - 3), range(1000))) AS print_0; +``` + +Result: + +``` text +┌─print_0─┐ +│ 6 │ +└─────────┘ +``` diff --git a/docs/en/sql-reference/statements/alter/apply-deleted-mask.md b/docs/en/sql-reference/statements/alter/apply-deleted-mask.md new file mode 100644 index 00000000000..7a11d66e739 --- /dev/null +++ b/docs/en/sql-reference/statements/alter/apply-deleted-mask.md @@ -0,0 +1,22 @@ +--- +slug: /en/sql-reference/statements/alter/apply-deleted-mask +sidebar_position: 46 +sidebar_label: APPLY DELETED MASK +--- + +# Apply mask of deleted rows + +``` sql +ALTER TABLE [db].name [ON CLUSTER cluster] APPLY DELETED MASK [IN PARTITION partition_id] +``` + +The command applies the mask created by [lightweight delete](/docs/en/sql-reference/statements/delete) and forcefully removes rows marked as deleted from disk. This command is a heavyweight mutation and is semantically equivalent to the query ```ALTER TABLE [db].name DELETE WHERE _row_exists = 0```. + +:::note +It only works for tables in the [`MergeTree`](../../../engines/table-engines/mergetree-family/mergetree.md) family (including [replicated](../../../engines/table-engines/mergetree-family/replication.md) tables). +::: + +**See also** + +- [Lightweight deletes](/docs/en/sql-reference/statements/delete) +- [Heavyweight deletes](/docs/en/sql-reference/statements/alter/delete.md) diff --git a/docs/en/sql-reference/statements/alter/index.md b/docs/en/sql-reference/statements/alter/index.md index d28542e0a43..dc6668c7983 100644 --- a/docs/en/sql-reference/statements/alter/index.md +++ b/docs/en/sql-reference/statements/alter/index.md @@ -17,8 +17,9 @@ Most `ALTER TABLE` queries modify table settings or data: - [CONSTRAINT](/docs/en/sql-reference/statements/alter/constraint.md) - [TTL](/docs/en/sql-reference/statements/alter/ttl.md) - [STATISTIC](/docs/en/sql-reference/statements/alter/statistic.md) +- [APPLY DELETED MASK](/docs/en/sql-reference/statements/alter/apply-deleted-mask.md) -:::note +:::note Most `ALTER TABLE` queries are supported only for [\*MergeTree](/docs/en/engines/table-engines/mergetree-family/index.md) tables, as well as [Merge](/docs/en/engines/table-engines/special/merge.md) and [Distributed](/docs/en/engines/table-engines/special/distributed.md). ::: @@ -59,7 +60,7 @@ For all `ALTER` queries, you can use the [alter_sync](/docs/en/operations/settin You can specify how long (in seconds) to wait for inactive replicas to execute all `ALTER` queries with the [replication_wait_for_inactive_replica_timeout](/docs/en/operations/settings/settings.md/#replication-wait-for-inactive-replica-timeout) setting. -:::note +:::note For all `ALTER` queries, if `alter_sync = 2` and some replicas are not active for more than the time, specified in the `replication_wait_for_inactive_replica_timeout` setting, then an exception `UNFINISHED` is thrown. ::: diff --git a/docs/en/sql-reference/statements/alter/view.md b/docs/en/sql-reference/statements/alter/view.md index 5c5bf0355f6..517e64e3e5b 100644 --- a/docs/en/sql-reference/statements/alter/view.md +++ b/docs/en/sql-reference/statements/alter/view.md @@ -6,28 +6,28 @@ sidebar_label: VIEW # ALTER TABLE … MODIFY QUERY Statement -You can modify `SELECT` query that was specified when a [materialized view](../create/view.md#materialized) was created with the `ALTER TABLE … MODIFY QUERY` statement without interrupting ingestion process.
+You can modify `SELECT` query that was specified when a [materialized view](../create/view.md#materialized) was created with the `ALTER TABLE … MODIFY QUERY` statement without interrupting ingestion process. -The `allow_experimental_alter_materialized_view_structure` setting must be enabled. +The `allow_experimental_alter_materialized_view_structure` setting must be enabled. This command is created to change materialized view created with `TO [db.]name` clause. It does not change the structure of the underling storage table and it does not change the columns' definition of the materialized view, because of this the application of this command is very limited for materialized views are created without `TO [db.]name` clause. **Example with TO table** ```sql -CREATE TABLE events (ts DateTime, event_type String) +CREATE TABLE events (ts DateTime, event_type String) ENGINE = MergeTree ORDER BY (event_type, ts); -CREATE TABLE events_by_day (ts DateTime, event_type String, events_cnt UInt64) +CREATE TABLE events_by_day (ts DateTime, event_type String, events_cnt UInt64) ENGINE = SummingMergeTree ORDER BY (event_type, ts); -CREATE MATERIALIZED VIEW mv TO events_by_day AS +CREATE MATERIALIZED VIEW mv TO events_by_day AS SELECT toStartOfDay(ts) ts, event_type, count() events_cnt FROM events -GROUP BY ts, event_type; +GROUP BY ts, event_type; -INSERT INTO events -SELECT Date '2020-01-01' + interval number * 900 second, +INSERT INTO events +SELECT Date '2020-01-01' + interval number * 900 second, ['imp', 'click'][number%2+1] FROM numbers(100); @@ -43,23 +43,23 @@ ORDER BY ts, event_type; │ 2020-01-02 00:00:00 │ imp │ 2 │ └─────────────────────┴────────────┴─────────────────┘ --- Let's add the new measurment `cost` +-- Let's add the new measurment `cost` -- and the new dimension `browser`. -ALTER TABLE events +ALTER TABLE events ADD COLUMN browser String, ADD COLUMN cost Float64; -- Column do not have to match in a materialized view and TO -- (destination table), so the next alter does not break insertion. -ALTER TABLE events_by_day +ALTER TABLE events_by_day ADD COLUMN cost Float64, ADD COLUMN browser String after event_type, MODIFY ORDER BY (event_type, ts, browser); -INSERT INTO events -SELECT Date '2020-01-02' + interval number * 900 second, +INSERT INTO events +SELECT Date '2020-01-02' + interval number * 900 second, ['imp', 'click'][number%2+1], ['firefox', 'safary', 'chrome'][number%3+1], 10/(number+1)%33 @@ -82,16 +82,16 @@ ORDER BY ts, event_type; └─────────────────────┴────────────┴─────────┴────────────┴──────┘ SET allow_experimental_alter_materialized_view_structure=1; - -ALTER TABLE mv MODIFY QUERY + +ALTER TABLE mv MODIFY QUERY SELECT toStartOfDay(ts) ts, event_type, browser, count() events_cnt, sum(cost) cost FROM events GROUP BY ts, event_type, browser; -INSERT INTO events -SELECT Date '2020-01-03' + interval number * 900 second, +INSERT INTO events +SELECT Date '2020-01-03' + interval number * 900 second, ['imp', 'click'][number%2+1], ['firefox', 'safary', 'chrome'][number%3+1], 10/(number+1)%33 @@ -138,7 +138,7 @@ PRIMARY KEY (event_type, ts) ORDER BY (event_type, ts, browser) SETTINGS index_granularity = 8192 --- !!! The columns' definition is unchanged but it does not matter, we are not quering +-- !!! The columns' definition is unchanged but it does not matter, we are not quering -- MATERIALIZED VIEW, we are quering TO (storage) table. -- SELECT section is updated. 
@@ -169,7 +169,7 @@ The application is very limited because you can only change the `SELECT` section ```sql CREATE TABLE src_table (`a` UInt32) ENGINE = MergeTree ORDER BY a; -CREATE MATERIALIZED VIEW mv (`a` UInt32) ENGINE = MergeTree ORDER BY a AS SELECT a FROM src_table; +CREATE MATERIALIZED VIEW mv (`a` UInt32) ENGINE = MergeTree ORDER BY a AS SELECT a FROM src_table; INSERT INTO src_table (a) VALUES (1), (2); SELECT * FROM mv; ``` @@ -199,3 +199,7 @@ SELECT * FROM mv; ## ALTER LIVE VIEW Statement `ALTER LIVE VIEW ... REFRESH` statement refreshes a [Live view](../create/view.md#live-view). See [Force Live View Refresh](../create/view.md#live-view-alter-refresh). + +## ALTER TABLE … MODIFY REFRESH Statement + +`ALTER TABLE ... MODIFY REFRESH` statement changes refresh parameters of a [Refreshable Materialized View](../create/view.md#refreshable-materialized-view). See [Changing Refresh Parameters](../create/view.md#changing-refresh-parameters). diff --git a/docs/en/sql-reference/statements/create/view.md b/docs/en/sql-reference/statements/create/view.md index 2a8d6788889..f6158acd9a4 100644 --- a/docs/en/sql-reference/statements/create/view.md +++ b/docs/en/sql-reference/statements/create/view.md @@ -37,6 +37,7 @@ SELECT a, b, c FROM (SELECT ...) ``` ## Parameterized View + Parametrized views are similar to normal views, but can be created with parameters which are not resolved immediately. These views can be used with table functions, which specify the name of the view as function name and the parameter values as its arguments. ``` sql @@ -66,7 +67,7 @@ When creating a materialized view with `TO [db].[table]`, you can't also use `PO A materialized view is implemented as follows: when inserting data to the table specified in `SELECT`, part of the inserted data is converted by this `SELECT` query, and the result is inserted in the view. -:::note +:::note Materialized views in ClickHouse use **column names** instead of column order during insertion into destination table. If some column names are not present in the `SELECT` query result, ClickHouse uses a default value, even if the column is not [Nullable](../../data-types/nullable.md). A safe practice would be to add aliases for every column when using Materialized views. Materialized views in ClickHouse are implemented more like insert triggers. If there’s some aggregation in the view query, it’s applied only to the batch of freshly inserted data. Any changes to existing data of source table (like update, delete, drop partition, etc.) does not change the materialized view. @@ -90,156 +91,122 @@ Views look the same as normal tables. For example, they are listed in the result To delete a view, use [DROP VIEW](../../../sql-reference/statements/drop.md#drop-view). Although `DROP TABLE` works for VIEWs as well. -## Live View [Experimental] +## Live View [Deprecated] -:::note -This is an experimental feature that may change in backwards-incompatible ways in the future releases. Enable usage of live views and `WATCH` query using [allow_experimental_live_view](../../../operations/settings/settings.md#allow-experimental-live-view) setting. Input the command `set allow_experimental_live_view = 1`. +This feature is deprecated and will be removed in the future. 
+ +For your convenience, the old documentation is located [here](https://pastila.nl/?00f32652/fdf07272a7b54bda7e13b919264e449f.md) + +## Refreshable Materialized View {#refreshable-materialized-view} + +```sql +CREATE MATERIALIZED VIEW [IF NOT EXISTS] [db.]table_name +REFRESH EVERY|AFTER interval [OFFSET interval] +RANDOMIZE FOR interval +DEPENDS ON [db.]name [, [db.]name [, ...]] +[TO[db.]name] [(columns)] [ENGINE = engine] [EMPTY] +AS SELECT ... +``` +where `interval` is a sequence of simple intervals: +```sql +number SECOND|MINUTE|HOUR|DAY|WEEK|MONTH|YEAR +``` + +Periodically runs the corresponding query and stores its result in a table, atomically replacing the table's previous contents. + +Differences from regular non-refreshable materialized views: + * No insert trigger. I.e. when new data is inserted into the table specified in SELECT, it's *not* automatically pushed to the refreshable materialized view. The periodic refresh runs the entire query and replaces the entire table. + * No restrictions on the SELECT query. Table functions (e.g. `url()`), views, UNION, JOIN, are all allowed. + +:::note +Refreshable materialized views are a work in progress. Setting `allow_experimental_refreshable_materialized_view = 1` is required for creating one. Current limitations: + * not compatible with Replicated database or table engines, + * require [Atomic database engine](../../../engines/database-engines/atomic.md), + * no retries for failed refresh - we just skip to the next scheduled refresh time, + * no limit on number of concurrent refreshes. ::: +### Refresh Schedule + +Example refresh schedules: ```sql -CREATE LIVE VIEW [IF NOT EXISTS] [db.]table_name [WITH REFRESH [value_in_sec]] AS SELECT ... +REFRESH EVERY 1 DAY -- every day, at midnight (UTC) +REFRESH EVERY 1 MONTH -- on 1st day of every month, at midnight +REFRESH EVERY 1 MONTH OFFSET 5 DAY 2 HOUR -- on 6th day of every month, at 2:00 am +REFRESH EVERY 2 WEEK OFFSET 5 DAY 15 HOUR 10 MINUTE -- every other Saturday, at 3:10 pm +REFRESH EVERY 30 MINUTE -- at 00:00, 00:30, 01:00, 01:30, etc +REFRESH AFTER 30 MINUTE -- 30 minutes after the previous refresh completes, no alignment with time of day +-- REFRESH AFTER 1 HOUR OFFSET 1 MINUTE -- syntax errror, OFFSET is not allowed with AFTER ``` -Live views store result of the corresponding [SELECT](../../../sql-reference/statements/select/index.md) query and are updated any time the result of the query changes. Query result as well as partial result needed to combine with new data are stored in memory providing increased performance for repeated queries. Live views can provide push notifications when query result changes using the [WATCH](../../../sql-reference/statements/watch.md) query. +`RANDOMIZE FOR` randomly adjusts the time of each refresh, e.g.: +```sql +REFRESH EVERY 1 DAY OFFSET 2 HOUR RANDOMIZE FOR 1 HOUR -- every day at random time between 01:30 and 02:30 +``` -Live views are triggered by insert into the innermost table specified in the query. +At most one refresh may be running at a time, for a given view. E.g. if a view with `REFRESH EVERY 1 MINUTE` takes 2 minutes to refresh, it'll just be refreshing every 2 minutes. If it then becomes faster and starts refreshing in 10 seconds, it'll go back to refreshing every minute. (In particular, it won't refresh every 10 seconds to catch up with a backlog of missed refreshes - there's no such backlog.) -Live views work similarly to how a query in a distributed table works. 
But instead of combining partial results from different servers they combine partial result from current data with partial result from the new data. When a live view query includes a subquery then the cached partial result is only stored for the innermost subquery. +Additionally, a refresh is started immediately after the materialized view is created, unless `EMPTY` is specified in the `CREATE` query. If `EMPTY` is specified, the first refresh happens according to schedule. -:::info -- [Table function](../../../sql-reference/table-functions/index.md) is not supported as the innermost table. -- Tables that do not have inserts such as a [dictionary](../../../sql-reference/dictionaries/index.md), [system table](../../../operations/system-tables/index.md), a [normal view](#normal), or a [materialized view](#materialized) will not trigger a live view. -- Only queries where one can combine partial result from the old data plus partial result from the new data will work. Live view will not work for queries that require the complete data set to compute the final result or aggregations where the state of the aggregation must be preserved. -- Does not work with replicated or distributed tables where inserts are performed on different nodes. -- Can't be triggered by multiple tables. +### Dependencies {#refresh-dependencies} -See [WITH REFRESH](#live-view-with-refresh) to force periodic updates of a live view that in some cases can be used as a workaround. +`DEPENDS ON` synchronizes refreshes of different tables. By way of example, suppose there's a chain of two refreshable materialized views: +```sql +CREATE MATERIALIZED VIEW source REFRESH EVERY 1 DAY AS SELECT * FROM url(...) +CREATE MATERIALIZED VIEW destination REFRESH EVERY 1 DAY AS SELECT ... FROM source +``` +Without `DEPENDS ON`, both views will start a refresh at midnight, and `destination` typically will see yesterday's data in `source`. If we add dependency: +``` +CREATE MATERIALIZED VIEW destination REFRESH EVERY 1 DAY DEPENDS ON source AS SELECT ... FROM source +``` +then `destination`'s refresh will start only after `source`'s refresh finished for that day, so `destination` will be based on fresh data. + +Alternatively, the same result can be achieved with: +``` +CREATE MATERIALIZED VIEW destination REFRESH AFTER 1 HOUR DEPENDS ON source AS SELECT ... FROM source +``` +where `1 HOUR` can be any duration less than `source`'s refresh period. The dependent table won't be refreshed more frequently than any of its dependencies. This is a valid way to set up a chain of refreshable views without specifying the real refresh period more than once. + +A few more examples: + * `REFRESH EVERY 1 DAY OFFSET 10 MINUTE` (`destination`) depends on `REFRESH EVERY 1 DAY` (`source`)
+ If `source` refresh takes more than 10 minutes, `destination` will wait for it. + * `REFRESH EVERY 1 DAY OFFSET 1 HOUR` depends on `REFRESH EVERY 1 DAY OFFSET 23 HOUR`
+ Similar to the above, even though the corresponding refreshes happen on different calendar days. + `destination`'s refresh on day X+1 will wait for `source`'s refresh on day X (if it takes more than 2 hours). + * `REFRESH EVERY 2 HOUR` depends on `REFRESH EVERY 1 HOUR`
+ The 2 HOUR refresh happens after the 1 HOUR refresh for every other hour, e.g. after the midnight + refresh, then after the 2am refresh, etc. + * `REFRESH EVERY 1 MINUTE` depends on `REFRESH EVERY 2 HOUR`
+ `REFRESH AFTER 1 MINUTE` depends on `REFRESH EVERY 2 HOUR`
+ `REFRESH AFTER 1 MINUTE` depends on `REFRESH AFTER 2 HOUR`
+ `destination` is refreshed once after every `source` refresh, i.e. every 2 hours. The `1 MINUTE` is effectively ignored. + * `REFRESH AFTER 1 HOUR` depends on `REFRESH AFTER 1 HOUR`
+ Currently this is not recommended. + +:::note +`DEPENDS ON` only works between refreshable materialized views. Listing a regular table in the `DEPENDS ON` list will prevent the view from ever refreshing (dependencies can be removed with `ALTER`, see below). ::: -### Monitoring Live View Changes +### Changing Refresh Parameters {#changing-refresh-parameters} -You can monitor changes in the `LIVE VIEW` query result using [WATCH](../../../sql-reference/statements/watch.md) query. - -```sql -WATCH [db.]live_view +To change refresh parameters: +``` +ALTER TABLE [db.]name MODIFY REFRESH EVERY|AFTER ... [RANDOMIZE FOR ...] [DEPENDS ON ...] ``` -**Example:** +:::note +This replaces refresh schedule *and* dependencies. If the table had a `DEPENDS ON`, doing a `MODIFY REFRESH` without `DEPENDS ON` will remove the dependencies. +::: -```sql -CREATE TABLE mt (x Int8) Engine = MergeTree ORDER BY x; -CREATE LIVE VIEW lv AS SELECT sum(x) FROM mt; -``` -Watch a live view while doing a parallel insert into the source table. +### Other operations -```sql -WATCH lv; -``` +The status of all refreshable materialized views is available in table [`system.view_refreshes`](../../../operations/system-tables/view_refreshes.md). In particular, it contains refresh progress (if running), last and next refresh time, exception message if a refresh failed. -```bash -┌─sum(x)─┬─_version─┐ -│ 1 │ 1 │ -└────────┴──────────┘ -┌─sum(x)─┬─_version─┐ -│ 3 │ 2 │ -└────────┴──────────┘ -┌─sum(x)─┬─_version─┐ -│ 6 │ 3 │ -└────────┴──────────┘ -``` - -```sql -INSERT INTO mt VALUES (1); -INSERT INTO mt VALUES (2); -INSERT INTO mt VALUES (3); -``` - -Or add [EVENTS](../../../sql-reference/statements/watch.md#events-clause) clause to just get change events. - -```sql -WATCH [db.]live_view EVENTS; -``` - -**Example:** - -```sql -WATCH lv EVENTS; -``` - -```bash -┌─version─┐ -│ 1 │ -└─────────┘ -┌─version─┐ -│ 2 │ -└─────────┘ -┌─version─┐ -│ 3 │ -└─────────┘ -``` - -You can execute [SELECT](../../../sql-reference/statements/select/index.md) query on a live view in the same way as for any regular view or a table. If the query result is cached it will return the result immediately without running the stored query on the underlying tables. - -```sql -SELECT * FROM [db.]live_view WHERE ... -``` - -### Force Live View Refresh - -You can force live view refresh using the `ALTER LIVE VIEW [db.]table_name REFRESH` statement. - -### WITH REFRESH Clause - -When a live view is created with a `WITH REFRESH` clause then it will be automatically refreshed after the specified number of seconds elapse since the last refresh or trigger. - -```sql -CREATE LIVE VIEW [db.]table_name WITH REFRESH [value_in_sec] AS SELECT ... -``` - -If the refresh value is not specified then the value specified by the [periodic_live_view_refresh](../../../operations/settings/settings.md#periodic-live-view-refresh) setting is used. - -**Example:** - -```sql -CREATE LIVE VIEW lv WITH REFRESH 5 AS SELECT now(); -WATCH lv -``` - -```bash -┌───────────────now()─┬─_version─┐ -│ 2021-02-21 08:47:05 │ 1 │ -└─────────────────────┴──────────┘ -┌───────────────now()─┬─_version─┐ -│ 2021-02-21 08:47:10 │ 2 │ -└─────────────────────┴──────────┘ -┌───────────────now()─┬─_version─┐ -│ 2021-02-21 08:47:15 │ 3 │ -└─────────────────────┴──────────┘ -``` - -```sql -WATCH lv -``` - -``` -Code: 60. DB::Exception: Received from localhost:9000. DB::Exception: Table default.lv does not exist.. 
-``` - -### Live View Usage - -Most common uses of live view tables include: - -- Providing push notifications for query result changes to avoid polling. -- Caching results of most frequent queries to provide immediate query results. -- Watching for table changes and triggering a follow-up select queries. -- Watching metrics from system tables using periodic refresh. - -**See Also** -- [ALTER LIVE VIEW](../alter/view.md#alter-live-view) +To manually stop, start, trigger, or cancel refreshes use [`SYSTEM STOP|START|REFRESH|CANCEL VIEW`](../system.md#refreshable-materialized-views). ## Window View [Experimental] -:::info +:::info This is an experimental feature that may change in backwards-incompatible ways in the future releases. Enable usage of window views and `WATCH` query using [allow_experimental_window_view](../../../operations/settings/settings.md#allow-experimental-window-view) setting. Input the command `set allow_experimental_window_view = 1`. ::: diff --git a/docs/en/sql-reference/statements/insert-into.md b/docs/en/sql-reference/statements/insert-into.md index e0cc98c2351..f9d93305071 100644 --- a/docs/en/sql-reference/statements/insert-into.md +++ b/docs/en/sql-reference/statements/insert-into.md @@ -11,7 +11,7 @@ Inserts data into a table. **Syntax** ``` sql -INSERT INTO [TABLE] [db.]table [(c1, c2, c3)] VALUES (v11, v12, v13), (v21, v22, v23), ... +INSERT INTO [TABLE] [db.]table [(c1, c2, c3)] [SETTINGS ...] VALUES (v11, v12, v13), (v21, v22, v23), ... ``` You can specify a list of columns to insert using the `(c1, c2, c3)`. You can also use an expression with column [matcher](../../sql-reference/statements/select/index.md#asterisk) such as `*` and/or [modifiers](../../sql-reference/statements/select/index.md#select-modifiers) such as [APPLY](../../sql-reference/statements/select/index.md#apply-modifier), [EXCEPT](../../sql-reference/statements/select/index.md#except-modifier), [REPLACE](../../sql-reference/statements/select/index.md#replace-modifier). @@ -126,7 +126,7 @@ To insert a default value instead of `NULL` into a column with not nullable data **Syntax** ``` sql -INSERT INTO [TABLE] [db.]table [(c1, c2, c3)] FROM INFILE file_name [COMPRESSION type] FORMAT format_name +INSERT INTO [TABLE] [db.]table [(c1, c2, c3)] FROM INFILE file_name [COMPRESSION type] [SETTINGS ...] [FORMAT format_name] ``` Use the syntax above to insert data from a file, or files, stored on the **client** side. `file_name` and `type` are string literals. Input file [format](../../interfaces/formats.md) must be set in the `FORMAT` clause. diff --git a/docs/en/sql-reference/statements/optimize.md b/docs/en/sql-reference/statements/optimize.md index 07b5a196096..b5fc0a23745 100644 --- a/docs/en/sql-reference/statements/optimize.md +++ b/docs/en/sql-reference/statements/optimize.md @@ -17,7 +17,7 @@ This query tries to initialize an unscheduled merge of data parts for tables. No OPTIMIZE TABLE [db.]name [ON CLUSTER cluster] [PARTITION partition | PARTITION ID 'partition_id'] [FINAL] [DEDUPLICATE [BY expression]] ``` -The `OPTIMIZE` query is supported for [MergeTree](../../engines/table-engines/mergetree-family/mergetree.md) family, the [MaterializedView](../../engines/table-engines/special/materializedview.md) and the [Buffer](../../engines/table-engines/special/buffer.md) engines. Other table engines aren’t supported. 
+The `OPTIMIZE` query is supported for [MergeTree](../../engines/table-engines/mergetree-family/mergetree.md) family (including [materialized views](../../sql-reference/statements/create/view.md#materialized-view)) and the [Buffer](../../engines/table-engines/special/buffer.md) engines. Other table engines aren’t supported. When `OPTIMIZE` is used with the [ReplicatedMergeTree](../../engines/table-engines/mergetree-family/replication.md) family of table engines, ClickHouse creates a task for merging and waits for execution on all replicas (if the [alter_sync](../../operations/settings/settings.md#alter-sync) setting is set to `2`) or on current replica (if the [alter_sync](../../operations/settings/settings.md#alter-sync) setting is set to `1`). diff --git a/docs/en/sql-reference/statements/select/from.md b/docs/en/sql-reference/statements/select/from.md index a4f449ad321..06742ff74e2 100644 --- a/docs/en/sql-reference/statements/select/from.md +++ b/docs/en/sql-reference/statements/select/from.md @@ -34,7 +34,7 @@ Queries that use `FINAL` are executed slightly slower than similar queries that - Data is merged during query execution. - Queries with `FINAL` read primary key columns in addition to the columns specified in the query. -**In most cases, avoid using `FINAL`.** The common approach is to use different queries that assume the background processes of the `MergeTree` engine haven’t happened yet and deal with it by applying aggregation (for example, to discard duplicates). +`FINAL` requires additional compute and memory resources, as the processing that normally would occur at merge time must occur in memory at the time of the query. However, using FINAL is sometimes necessary in order to produce accurate results, and is less expensive than running `OPTIMIZE` to force a merge. It is also sometimes possible to use different queries that assume the background processes of the `MergeTree` engine haven’t happened yet and deal with it by applying aggregation (for example, to discard duplicates). If you need to use FINAL in your queries in order to get the required results, then it is okay to do so but be aware of the additional processing required. `FINAL` can be applied automatically using [FINAL](../../../operations/settings/settings.md#final) setting to all tables in a query using a session or a user profile. diff --git a/docs/en/sql-reference/statements/select/into-outfile.md b/docs/en/sql-reference/statements/select/into-outfile.md index 352af16042a..5b7196f13e3 100644 --- a/docs/en/sql-reference/statements/select/into-outfile.md +++ b/docs/en/sql-reference/statements/select/into-outfile.md @@ -12,7 +12,7 @@ Compressed files are supported. Compression type is detected by the extension of **Syntax** ```sql -SELECT INTO OUTFILE file_name [AND STDOUT] [APPEND] [COMPRESSION type [LEVEL level]] +SELECT INTO OUTFILE file_name [AND STDOUT] [APPEND | TRUNCATE] [COMPRESSION type [LEVEL level]] ``` `file_name` and `type` are string literals. Supported compression types are: `'none'`, `'gzip'`, `'deflate'`, `'br'`, `'xz'`, `'zstd'`, `'lz4'`, `'bz2'`. @@ -26,6 +26,7 @@ SELECT INTO OUTFILE file_name [AND STDOUT] [APPEND] [COMPRESSION typ - The default [output format](../../../interfaces/formats.md) is `TabSeparated` (like in the command-line client batch mode). Use [FORMAT](format.md) clause to change it. - If `AND STDOUT` is mentioned in the query then the output that is written to the file is also displayed on standard output. 
If used with compression, the plaintext is displayed on standard output. - If `APPEND` is mentioned in the query then the output is appended to an existing file. If compression is used, append cannot be used. +- When writing to a file that already exists, `APPEND` or `TRUNCATE` must be used. **Example** diff --git a/docs/en/sql-reference/statements/select/join.md b/docs/en/sql-reference/statements/select/join.md index 281a1d0436c..0529be06b5d 100644 --- a/docs/en/sql-reference/statements/select/join.md +++ b/docs/en/sql-reference/statements/select/join.md @@ -43,22 +43,23 @@ Additional join types available in ClickHouse: - `LEFT ANTI JOIN` and `RIGHT ANTI JOIN`, a blacklist on “join keys”, without producing a cartesian product. - `LEFT ANY JOIN`, `RIGHT ANY JOIN` and `INNER ANY JOIN`, partially (for opposite side of `LEFT` and `RIGHT`) or completely (for `INNER` and `FULL`) disables the cartesian product for standard `JOIN` types. - `ASOF JOIN` and `LEFT ASOF JOIN`, joining sequences with a non-exact match. `ASOF JOIN` usage is described below. +- `PASTE JOIN`, performs a horizontal concatenation of two tables. :::note -When [join_algorithm](../../../operations/settings/settings.md#settings-join_algorithm) is set to `partial_merge`, `RIGHT JOIN` and `FULL JOIN` are supported only with `ALL` strictness (`SEMI`, `ANTI`, `ANY`, and `ASOF` are not supported). +When [join_algorithm](../../../operations/settings/settings.md#join_algorithm) is set to `partial_merge`, `RIGHT JOIN` and `FULL JOIN` are supported only with `ALL` strictness (`SEMI`, `ANTI`, `ANY`, and `ASOF` are not supported). ::: ## Settings -The default join type can be overridden using [join_default_strictness](../../../operations/settings/settings.md#settings-join_default_strictness) setting. +The default join type can be overridden using [join_default_strictness](../../../operations/settings/settings.md#join_default_strictness) setting. The behavior of ClickHouse server for `ANY JOIN` operations depends on the [any_join_distinct_right_table_keys](../../../operations/settings/settings.md#any_join_distinct_right_table_keys) setting. **See also** -- [join_algorithm](../../../operations/settings/settings.md#settings-join_algorithm) -- [join_any_take_last_row](../../../operations/settings/settings.md#settings-join_any_take_last_row) +- [join_algorithm](../../../operations/settings/settings.md#join_algorithm) +- [join_any_take_last_row](../../../operations/settings/settings.md#join_any_take_last_row) - [join_use_nulls](../../../operations/settings/settings.md#join_use_nulls) - [partial_merge_join_optimizations](../../../operations/settings/settings.md#partial_merge_join_optimizations) - [partial_merge_join_rows_in_right_blocks](../../../operations/settings/settings.md#partial_merge_join_rows_in_right_blocks) @@ -269,6 +270,33 @@ For example, consider the following tables: `ASOF` join is **not** supported in the [Join](../../../engines/table-engines/special/join.md) table engine. ::: +## PASTE JOIN Usage + +The result of `PASTE JOIN` is a table that contains all columns from left subquery followed by all columns from the right subquery. +The rows are matched based on their positions in the original tables (the order of rows should be defined). +If the subqueries return a different number of rows, extra rows will be cut. 
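For instance, if the left-hand subquery returns three rows and the right-hand one returns two, only two rows are produced and the extra left-hand row is dropped. A minimal sketch of that truncation behaviour (illustrative only, not part of the reference example below):

```sql
SELECT *
FROM
(
    SELECT number AS a
    FROM numbers(3)
    ORDER BY a
) AS t1
PASTE JOIN
(
    SELECT number AS b
    FROM numbers(2)
    ORDER BY b
) AS t2
-- expected to return two rows, (0, 0) and (1, 1); the left-hand row with a = 2 is cut
```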
+ +Example: +```SQL +SELECT * +FROM +( + SELECT number AS a + FROM numbers(2) +) AS t1 +PASTE JOIN +( + SELECT number AS a + FROM numbers(2) + ORDER BY a DESC +) AS t2 + +┌─a─┬─t2.a─┐ +│ 0 │ 1 │ +│ 1 │ 0 │ +└───┴──────┘ +``` + ## Distributed JOIN There are two ways to execute join involving distributed tables: @@ -352,7 +380,7 @@ If you need a `JOIN` for joining with dimension tables (these are relatively sma ### Memory Limitations -By default, ClickHouse uses the [hash join](https://en.wikipedia.org/wiki/Hash_join) algorithm. ClickHouse takes the right_table and creates a hash table for it in RAM. If `join_algorithm = 'auto'` is enabled, then after some threshold of memory consumption, ClickHouse falls back to [merge](https://en.wikipedia.org/wiki/Sort-merge_join) join algorithm. For `JOIN` algorithms description see the [join_algorithm](../../../operations/settings/settings.md#settings-join_algorithm) setting. +By default, ClickHouse uses the [hash join](https://en.wikipedia.org/wiki/Hash_join) algorithm. ClickHouse takes the right_table and creates a hash table for it in RAM. If `join_algorithm = 'auto'` is enabled, then after some threshold of memory consumption, ClickHouse falls back to [merge](https://en.wikipedia.org/wiki/Sort-merge_join) join algorithm. For `JOIN` algorithms description see the [join_algorithm](../../../operations/settings/settings.md#join_algorithm) setting. If you need to restrict `JOIN` operation memory consumption use the following settings: diff --git a/docs/en/sql-reference/statements/select/order-by.md b/docs/en/sql-reference/statements/select/order-by.md index 53bdc9041a1..d6432a7b4f8 100644 --- a/docs/en/sql-reference/statements/select/order-by.md +++ b/docs/en/sql-reference/statements/select/order-by.md @@ -5,12 +5,22 @@ sidebar_label: ORDER BY # ORDER BY Clause -The `ORDER BY` clause contains a list of expressions, which can each be attributed with `DESC` (descending) or `ASC` (ascending) modifier which determine the sorting direction. If the direction is not specified, `ASC` is assumed, so it’s usually omitted. The sorting direction applies to a single expression, not to the entire list. Example: `ORDER BY Visits DESC, SearchPhrase`. Sorting is case-sensitive. +The `ORDER BY` clause contains -If you want to sort by column numbers instead of column names, enable the setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments). +- a list of expressions, e.g. `ORDER BY visits, search_phrase`, +- a list of numbers referring to columns in the `SELECT` clause, e.g. `ORDER BY 2, 1`, or +- `ALL` which means all columns of the `SELECT` clause, e.g. `ORDER BY ALL`. -Rows that have identical values for the list of sorting expressions are output in an arbitrary order, which can also be non-deterministic (different each time). -If the ORDER BY clause is omitted, the order of the rows is also undefined, and may be non-deterministic as well. +To disable sorting by column numbers, set setting [enable_positional_arguments](../../../operations/settings/settings.md#enable-positional-arguments) = 0. +To disable sorting by `ALL`, set setting [enable_order_by_all](../../../operations/settings/settings.md#enable-order-by-all) = 0. + +The `ORDER BY` clause can be attributed by a `DESC` (descending) or `ASC` (ascending) modifier which determines the sorting direction. +Unless an explicit sort order is specified, `ASC` is used by default. +The sorting direction applies to a single expression, not to the entire list, e.g. 
`ORDER BY Visits DESC, SearchPhrase`. +Also, sorting is performed case-sensitively. + +Rows with identical values for all sort expressions are returned in an arbitrary and non-deterministic order. +If the `ORDER BY` clause is omitted in a `SELECT` statement, the row order is also arbitrary and non-deterministic. ## Sorting of Special Values @@ -265,8 +275,9 @@ Consider disabling `optimize_read_in_order` manually, when running queries that Optimization is supported in the following table engines: -- [MergeTree](../../../engines/table-engines/mergetree-family/mergetree.md) -- [Merge](../../../engines/table-engines/special/merge.md), [Buffer](../../../engines/table-engines/special/buffer.md), and [MaterializedView](../../../engines/table-engines/special/materializedview.md) table engines over `MergeTree`-engine tables +- [MergeTree](../../../engines/table-engines/mergetree-family/mergetree.md) (including [materialized views](../../../sql-reference/statements/create/view.md#materialized-view)), +- [Merge](../../../engines/table-engines/special/merge.md), +- [Buffer](../../../engines/table-engines/special/buffer.md) In `MaterializedView`-engine tables the optimization works with views like `SELECT ... FROM merge_tree_table ORDER BY pk`. But it is not supported in the queries like `SELECT ... FROM view ORDER BY pk` if the view query does not have the `ORDER BY` clause. diff --git a/docs/en/sql-reference/statements/system.md b/docs/en/sql-reference/statements/system.md index 177a8283f38..0fdbbeac235 100644 --- a/docs/en/sql-reference/statements/system.md +++ b/docs/en/sql-reference/statements/system.md @@ -150,7 +150,7 @@ SYSTEM RELOAD CONFIG [ON CLUSTER cluster_name] ## RELOAD USERS -Reloads all access storages, including: users.xml, local disk access storage, replicated (in ZooKeeper) access storage. +Reloads all access storages, including: users.xml, local disk access storage, replicated (in ZooKeeper) access storage. ```sql SYSTEM RELOAD USERS [ON CLUSTER cluster_name] @@ -354,7 +354,7 @@ After running this statement the `[db.]replicated_merge_tree_family_table_name` ### SYNC DATABASE REPLICA -Waits until the specified [replicated database](https://clickhouse.com/docs/en/engines/database-engines/replicated) applies all schema changes from the DDL queue of that database. +Waits until the specified [replicated database](https://clickhouse.com/docs/en/engines/database-engines/replicated) applies all schema changes from the DDL queue of that database. **Syntax** ```sql @@ -449,14 +449,14 @@ SYSTEM SYNC FILE CACHE [ON CLUSTER cluster_name] ``` -### SYSTEM STOP LISTEN +## SYSTEM STOP LISTEN -Closes the socket and gracefully terminates the existing connections to the server on the specified port with the specified protocol. +Closes the socket and gracefully terminates the existing connections to the server on the specified port with the specified protocol. However, if the corresponding protocol settings were not specified in the clickhouse-server configuration, this command will have no effect.
```sql -SYSTEM STOP LISTEN [ON CLUSTER cluster_name] [QUERIES ALL | QUERIES DEFAULT | QUERIES CUSTOM | TCP | TCP_WITH_PROXY | TCP_SECURE | HTTP | HTTPS | MYSQL | GRPC | POSTGRESQL | PROMETHEUS | CUSTOM 'protocol'] +SYSTEM STOP LISTEN [ON CLUSTER cluster_name] [QUERIES ALL | QUERIES DEFAULT | QUERIES CUSTOM | TCP | TCP WITH PROXY | TCP SECURE | HTTP | HTTPS | MYSQL | GRPC | POSTGRESQL | PROMETHEUS | CUSTOM 'protocol'] ``` - If `CUSTOM 'protocol'` modifier is specified, the custom protocol with the specified name defined in the protocols section of the server configuration will be stopped. @@ -464,12 +464,56 @@ SYSTEM STOP LISTEN [ON CLUSTER cluster_name] [QUERIES ALL | QUERIES DEFAULT | QU - If `QUERIES DEFAULT [EXCEPT .. [,..]]` modifier is specified, all default protocols are stopped, unless specified with `EXCEPT` clause. - If `QUERIES CUSTOM [EXCEPT .. [,..]]` modifier is specified, all custom protocols are stopped, unless specified with `EXCEPT` clause. -### SYSTEM START LISTEN +## SYSTEM START LISTEN Allows new connections to be established on the specified protocols. However, if the server on the specified port and protocol was not stopped using the SYSTEM STOP LISTEN command, this command will have no effect. ```sql -SYSTEM START LISTEN [ON CLUSTER cluster_name] [QUERIES ALL | QUERIES DEFAULT | QUERIES CUSTOM | TCP | TCP_WITH_PROXY | TCP_SECURE | HTTP | HTTPS | MYSQL | GRPC | POSTGRESQL | PROMETHEUS | CUSTOM 'protocol'] +SYSTEM START LISTEN [ON CLUSTER cluster_name] [QUERIES ALL | QUERIES DEFAULT | QUERIES CUSTOM | TCP | TCP WITH PROXY | TCP SECURE | HTTP | HTTPS | MYSQL | GRPC | POSTGRESQL | PROMETHEUS | CUSTOM 'protocol'] +``` + +## Managing Refreshable Materialized Views {#refreshable-materialized-views} + +Commands to control background tasks performed by [Refreshable Materialized Views](../../sql-reference/statements/create/view.md#refreshable-materialized-view) + +Keep an eye on [`system.view_refreshes`](../../operations/system-tables/view_refreshes.md) while using them. + +### SYSTEM REFRESH VIEW + +Trigger an immediate out-of-schedule refresh of a given view. + +```sql +SYSTEM REFRESH VIEW [db.]name +``` + +### SYSTEM STOP VIEW, SYSTEM STOP VIEWS + +Disable periodic refreshing of the given view or all refreshable views. If a refresh is in progress, cancel it too. + +```sql +SYSTEM STOP VIEW [db.]name +``` +```sql +SYSTEM STOP VIEWS +``` + +### SYSTEM START VIEW, SYSTEM START VIEWS + +Enable periodic refreshing for the given view or all refreshable views. No immediate refresh is triggered. + +```sql +SYSTEM START VIEW [db.]name +``` +```sql +SYSTEM START VIEWS +``` + +### SYSTEM CANCEL VIEW + +If there's a refresh in progress for the given view, interrupt and cancel it. Otherwise do nothing. + +```sql +SYSTEM CANCEL VIEW [db.]name ``` diff --git a/docs/en/sql-reference/syntax.md b/docs/en/sql-reference/syntax.md index f5651c2dcb6..6dcb3e75e48 100644 --- a/docs/en/sql-reference/syntax.md +++ b/docs/en/sql-reference/syntax.md @@ -16,7 +16,7 @@ INSERT INTO t VALUES (1, 'Hello, world'), (2, 'abc'), (3, 'def') The `INSERT INTO t VALUES` fragment is parsed by the full parser, and the data `(1, 'Hello, world'), (2, 'abc'), (3, 'def')` is parsed by the fast stream parser. You can also turn on the full parser for the data by using the [input_format_values_interpret_expressions](../operations/settings/settings-formats.md#input_format_values_interpret_expressions) setting. 
When `input_format_values_interpret_expressions = 1`, ClickHouse first tries to parse values with the fast stream parser. If it fails, ClickHouse tries to use the full parser for the data, treating it like an SQL [expression](#expressions). -Data can have any format. When a query is received, the server calculates no more than [max_query_size](../operations/settings/settings.md#settings-max_query_size) bytes of the request in RAM (by default, 1 MB), and the rest is stream parsed. +Data can have any format. When a query is received, the server calculates no more than [max_query_size](../operations/settings/settings.md#max_query_size) bytes of the request in RAM (by default, 1 MB), and the rest is stream parsed. It allows for avoiding issues with large `INSERT` queries. When using the `Values` format in an `INSERT` query, it may seem that data is parsed the same as expressions in a `SELECT` query, but this is not true. The `Values` format is much more limited. diff --git a/docs/en/sql-reference/table-functions/cluster.md b/docs/en/sql-reference/table-functions/cluster.md index a083c6b89a6..ad92ab39183 100644 --- a/docs/en/sql-reference/table-functions/cluster.md +++ b/docs/en/sql-reference/table-functions/cluster.md @@ -55,5 +55,5 @@ Connection settings like `host`, `port`, `user`, `password`, `compression`, `sec **See Also** -- [skip_unavailable_shards](../../operations/settings/settings.md#settings-skip_unavailable_shards) -- [load_balancing](../../operations/settings/settings.md#settings-load_balancing) +- [skip_unavailable_shards](../../operations/settings/settings.md#skip_unavailable_shards) +- [load_balancing](../../operations/settings/settings.md#load_balancing) diff --git a/docs/en/sql-reference/table-functions/file.md b/docs/en/sql-reference/table-functions/file.md index ad1feb87c60..3a63811add6 100644 --- a/docs/en/sql-reference/table-functions/file.md +++ b/docs/en/sql-reference/table-functions/file.md @@ -1,4 +1,4 @@ - -- +--- slug: /en/sql-reference/table-functions/file sidebar_position: 60 sidebar_label: file @@ -128,17 +128,17 @@ Reading data from `table.csv`, located in `archive1.zip` or/and `archive2.zip`: SELECT * FROM file('user_files/archives/archive{1..2}.zip :: table.csv'); ``` -## Globbing {#globs_in_path} +## Globs in path {#globs_in_path} Paths may use globbing. Files must match the whole path pattern, not only the suffix or prefix. - `*` — Represents arbitrarily many characters except `/` but including the empty string. - `?` — Represents an arbitrary single character. -- `{some_string,another_string,yet_another_one}` — Represents any of alternative strings `'some_string', 'another_string', 'yet_another_one'`. The strings may contain `/`. +- `{some_string,another_string,yet_another_one}` — Substitutes any of strings `'some_string', 'another_string', 'yet_another_one'`. The strings can contain the `/` symbol. - `{N..M}` — Represents any number `>= N` and `<= M`. - `**` - Represents all files inside a folder recursively. -Constructions with `{}` are similar to the [remote](remote.md) table function. +Constructions with `{}` are similar to the [remote](remote.md) and [hdfs](hdfs.md) table functions. **Example** @@ -199,11 +199,11 @@ SELECT count(*) FROM file('big_dir/**/file002', 'CSV', 'name String, value UInt3 ## Settings {#settings} -- [engine_file_empty_if_not_exists](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - allows to select empty data from a file that doesn't exist. Disabled by default. 
+- [engine_file_empty_if_not_exists](/docs/en/operations/settings/settings.md#engine-file-empty_if-not-exists) - allows to select empty data from a file that doesn't exist. Disabled by default. - [engine_file_truncate_on_insert](/docs/en/operations/settings/settings.md#engine-file-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. - [engine_file_allow_create_multiple_files](/docs/en/operations/settings/settings.md#engine_file_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [engine_file_skip_empty_files](/docs/en/operations/settings/settings.md#engine_file_skip_empty_files) - allows to skip empty files while reading. Disabled by default. -- [storage_file_read_method](/docs/en/operations/settings/settings.md#engine-file-emptyif-not-exists) - method of reading data from storage file, one of: read, pread, mmap (only for clickhouse-local). Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local. +- [storage_file_read_method](/docs/en/operations/settings/settings.md#engine-file-empty_if-not-exists) - method of reading data from storage file, one of: read, pread, mmap (only for clickhouse-local). Default value: `pread` for clickhouse-server, `mmap` for clickhouse-local. **See Also** diff --git a/docs/en/sql-reference/table-functions/fileCluster.md b/docs/en/sql-reference/table-functions/fileCluster.md index 22ca132f136..2646250311c 100644 --- a/docs/en/sql-reference/table-functions/fileCluster.md +++ b/docs/en/sql-reference/table-functions/fileCluster.md @@ -45,7 +45,7 @@ $ cat /var/lib/clickhouse/user_files/test1.csv 1,"file1" 11,"file11" -$ cat /var/lib/clickhouse/user_files/test1.csv +$ cat /var/lib/clickhouse/user_files/test2.csv 2,"file2" 22,"file22" ``` diff --git a/docs/en/sql-reference/table-functions/fuzzJSON.md b/docs/en/sql-reference/table-functions/fuzzJSON.md index 74ccb0bcb8a..a64f35691f6 100644 --- a/docs/en/sql-reference/table-functions/fuzzJSON.md +++ b/docs/en/sql-reference/table-functions/fuzzJSON.md @@ -19,6 +19,7 @@ fuzzJSON({ named_collection [option=value [,..]] | json_str[, random_seed] }) - `json_str` (String) - The source string representing structured data in JSON format. - `random_seed` (UInt64) - Manual random seed for producing stable results. - `reuse_output` (boolean) - Reuse the output from a fuzzing process as input for the next fuzzer. + - `malform_output` (boolean) - Generate a string that cannot be parsed as a JSON object. - `max_output_length` (UInt64) - Maximum allowable length of the generated or perturbed JSON string. - `probability` (Float64) - The probability to fuzz a JSON field (a key-value pair). Must be within [0, 1] range. - `max_nesting_level` (UInt64) - The maximum allowed depth of nested structures within the JSON data. 
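Several of these options can be combined in a single call. A minimal sketch (assuming the `json_nc` named collection used in the examples below; the fuzzed output varies between runs and seeds):

```sql
-- illustrative only: combine a fixed seed with output-length and fuzz-probability limits
SELECT *
FROM fuzzJSON(json_nc, json_str='{"name" : "FuzzJSON"}', random_seed=42, max_output_length=128, probability=0.3)
LIMIT 3;
```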
@@ -84,3 +85,13 @@ SELECT * FROM fuzzJSON('{"id":1}', 1234) LIMIT 3; {"BRjE":16137826149911306846} {"XjKE":15076727133550123563} ``` + +``` sql +SELECT * FROM fuzzJSON(json_nc, json_str='{"name" : "FuzzJSON"}', random_seed=1337, malform_output=true) LIMIT 3; +``` + +``` text +U"name":"FuzzJSON*"SpByjZKtr2VAyHCO"falseh +{"name"keFuzzJSON, "g6vVO7TCIk":jTt^ +{"DBhz":YFuzzJSON5} +``` diff --git a/docs/en/sql-reference/table-functions/hdfs.md b/docs/en/sql-reference/table-functions/hdfs.md index 31780e30e8e..92f904b8841 100644 --- a/docs/en/sql-reference/table-functions/hdfs.md +++ b/docs/en/sql-reference/table-functions/hdfs.md @@ -41,14 +41,14 @@ LIMIT 2 ## Globs in path {#globs_in_path} -Multiple path components can have globs. For being processed file should exists and matches to the whole path pattern (not only suffix or prefix). +Paths may use globbing. Files must match the whole path pattern, not only the suffix or prefix. -- `*` — Substitutes any number of any characters except `/` including empty string. -- `?` — Substitutes any single character. +- `*` — Represents arbitrarily many characters except `/` but including the empty string. +- `?` — Represents an arbitrary single character. - `{some_string,another_string,yet_another_one}` — Substitutes any of strings `'some_string', 'another_string', 'yet_another_one'`. The strings can contain the `/` symbol. -- `{N..M}` — Substitutes any number in range from N to M including both borders. +- `{N..M}` — Represents any number `>= N` and `<= M`. -Constructions with `{}` are similar to the [remote](../../sql-reference/table-functions/remote.md)) table function. +Constructions with `{}` are similar to the [remote](remote.md) and [file](file.md) table functions. **Example** @@ -100,7 +100,7 @@ FROM hdfs('hdfs://hdfs1:9000/big_dir/file{0..9}{0..9}{0..9}', 'CSV', 'name Strin ## Storage Settings {#storage-settings} -- [hdfs_truncate_on_insert](/docs/en/operations/settings/settings.md#hdfs-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. +- [hdfs_truncate_on_insert](/docs/en/operations/settings/settings.md#hdfs_truncate_on_insert) - allows to truncate file before insert into it. Disabled by default. - [hdfs_create_multiple_files](/docs/en/operations/settings/settings.md#hdfs_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [hdfs_skip_empty_files](/docs/en/operations/settings/settings.md#hdfs_skip_empty_files) - allows to skip empty files while reading. Disabled by default. - [ignore_access_denied_multidirectory_globs](/docs/en/operations/settings/settings.md#ignore_access_denied_multidirectory_globs) - allows to ignore permission denied errors for multi-directory globs. diff --git a/docs/en/sql-reference/table-functions/remote.md b/docs/en/sql-reference/table-functions/remote.md index 3ca177050d3..228f4a4c7e1 100644 --- a/docs/en/sql-reference/table-functions/remote.md +++ b/docs/en/sql-reference/table-functions/remote.md @@ -165,5 +165,5 @@ The following pattern types are supported. - `{0n..0m}` - A range of numbers with leading zeroes. This pattern preserves leading zeroes in indices. For instance, `example{01..03}-1` generates `example01-1`, `example02-1` and `example03-1`. - `{a|b}` - Any number of variants separated by a `|`. The pattern specifies replicas. For instance, `example01-{1|2}` generates replicas `example01-1` and `example01-2`. -The query will be sent to the first healthy replica. 
However, for `remote` the replicas are iterated in the order currently set in the [load_balancing](../../operations/settings/settings.md#settings-load_balancing) setting. +The query will be sent to the first healthy replica. However, for `remote` the replicas are iterated in the order currently set in the [load_balancing](../../operations/settings/settings.md#load_balancing) setting. The number of generated addresses is limited by [table_function_remote_max_addresses](../../operations/settings/settings.md#table_function_remote_max_addresses) setting. diff --git a/docs/en/sql-reference/table-functions/s3.md b/docs/en/sql-reference/table-functions/s3.md index dc11259c626..8065f066666 100644 --- a/docs/en/sql-reference/table-functions/s3.md +++ b/docs/en/sql-reference/table-functions/s3.md @@ -16,7 +16,7 @@ When using the `s3 table function` with [`INSERT INTO...SELECT`](../../sql-refer **Syntax** ``` sql -s3(path [, NOSIGN | aws_access_key_id, aws_secret_access_key] [,format] [,structure] [,compression]) +s3(path [, NOSIGN | aws_access_key_id, aws_secret_access_key [,session_token]] [,format] [,structure] [,compression]) ``` :::tip GCS @@ -38,6 +38,8 @@ For GCS, substitute your HMAC key and HMAC secret where you see `aws_access_key_ ::: - `NOSIGN` - If this keyword is provided in place of credentials, all the requests will not be signed. +- `access_key_id`, `secret_access_key` — Keys that specify credentials to use with given endpoint. Optional. +- `session_token` - Session token to use with the given keys. Optional when passing keys. - `format` — The [format](../../interfaces/formats.md#formats) of the file. - `structure` — Structure of the table. Format `'column1_name column1_type, column2_name column2_type, ...'`. - `compression` — Parameter is optional. Supported values: `none`, `gzip/gz`, `brotli/br`, `xz/LZMA`, `zstd/zst`. By default, it will autodetect compression by file extension. @@ -236,7 +238,7 @@ LIMIT 5; ## Storage Settings {#storage-settings} -- [s3_truncate_on_insert](/docs/en/operations/settings/settings.md#s3-truncate-on-insert) - allows to truncate file before insert into it. Disabled by default. +- [s3_truncate_on_insert](/docs/en/operations/settings/settings.md#s3_truncate_on_insert) - allows to truncate file before insert into it. Disabled by default. - [s3_create_multiple_files](/docs/en/operations/settings/settings.md#s3_allow_create_multiple_files) - allows to create a new file on each insert if format has suffix. Disabled by default. - [s3_skip_empty_files](/docs/en/operations/settings/settings.md#s3_skip_empty_files) - allows to skip empty files while reading. Disabled by default. diff --git a/docs/en/sql-reference/table-functions/s3Cluster.md b/docs/en/sql-reference/table-functions/s3Cluster.md index 799eb31446a..080c9860519 100644 --- a/docs/en/sql-reference/table-functions/s3Cluster.md +++ b/docs/en/sql-reference/table-functions/s3Cluster.md @@ -10,14 +10,15 @@ Allows processing files from [Amazon S3](https://aws.amazon.com/s3/) and Google **Syntax** ``` sql -s3Cluster(cluster_name, source, [,access_key_id, secret_access_key] [,format] [,structure]) +s3Cluster(cluster_name, source, [,access_key_id, secret_access_key, [session_token]] [,format] [,structure]) ``` **Arguments** - `cluster_name` — Name of a cluster that is used to build a set of addresses and connection parameters to remote and local servers. - `source` — URL to a file or a bunch of files. 
Supports following wildcards in readonly mode: `*`, `**`, `?`, `{'abc','def'}` and `{N..M}` where `N`, `M` — numbers, `abc`, `def` — strings. For more information see [Wildcards In Path](../../engines/table-engines/integrations/s3.md#wildcards-in-path). -- `access_key_id` and `secret_access_key` — Keys that specify credentials to use with given endpoint. Optional. +- `access_key_id`, `secret_access_key` — Keys that specify credentials to use with given endpoint. Optional. +- `session_token` - Session token to use with the given keys. Optional when passing keys. - `format` — The [format](../../interfaces/formats.md#formats) of the file. - `structure` — Structure of the table. Format `'column1_name column1_type, column2_name column2_type, ...'`. diff --git a/docs/ru/development/style.md b/docs/ru/development/style.md index 49c4aade4e9..cd1297504af 100644 --- a/docs/ru/development/style.md +++ b/docs/ru/development/style.md @@ -493,7 +493,7 @@ catch (const DB::Exception & e) ``` cpp if (0 != close(fd)) - throwFromErrno("Cannot close file " + file_name, ErrorCodes::CANNOT_CLOSE_FILE); + throw ErrnoException(ErrorCodes::CANNOT_CLOSE_FILE, "Cannot close file {}", file_name); ``` `assert` не используются. diff --git a/docs/ru/engines/table-engines/mergetree-family/mergetree.md b/docs/ru/engines/table-engines/mergetree-family/mergetree.md index 7195ee38af6..9f223157ea7 100644 --- a/docs/ru/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/ru/engines/table-engines/mergetree-family/mergetree.md @@ -369,6 +369,9 @@ INDEX b (u64 * length(str), i32 + f64 * 100, date, str) TYPE set(100) GRANULARIT | [greaterOrEquals (\>=)](../../../sql-reference/functions/comparison-functions.md#greaterorequals) | ✔ | ✔ | ✗ | ✗ | ✗ | | [empty](../../../sql-reference/functions/array-functions.md#function-empty) | ✔ | ✔ | ✗ | ✗ | ✗ | | [notEmpty](../../../sql-reference/functions/array-functions.md#function-notempty) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [has](../../../sql-reference/functions/array-functions.md#function-has) | ✗ | ✗ | ✔ | ✔ | ✔ | ✔ | +| [hasAny](../../../sql-reference/functions/array-functions.md#function-hasAny) | ✗ | ✗ | ✔ | ✔ | ✔ | ✗ | +| [hasAll](../../../sql-reference/functions/array-functions.md#function-hasAll) | ✗ | ✗ | ✗ | ✗ | ✔ | ✗ | | hasToken | ✗ | ✗ | ✗ | ✔ | ✗ | Функции с постоянным агрументом, который меньше, чем размер ngram не могут использовать индекс `ngrambf_v1` для оптимизации запроса. @@ -681,7 +684,6 @@ TTL d + INTERVAL 1 MONTH GROUP BY k1, k2 SET x = max(x), y = min(y); - `disk` — диск, находящийся внутри тома. - `max_data_part_size_bytes` — максимальный размер куска данных, который может находиться на любом из дисков этого тома. Если в результате слияния размер куска ожидается больше, чем max_data_part_size_bytes, то этот кусок будет записан в следующий том. В основном эта функция позволяет хранить новые / мелкие куски на горячем (SSD) томе и перемещать их на холодный (HDD) том, когда они достигают большого размера. Не используйте этот параметр, если политика имеет только один том. - `move_factor` — доля доступного свободного места на томе, если места становится меньше, то данные начнут перемещение на следующий том, если он есть (по умолчанию 0.1). Для перемещения куски сортируются по размеру от большего к меньшему (по убыванию) и выбираются куски, совокупный размер которых достаточен для соблюдения условия `move_factor`, если совокупный размер всех партов недостаточен, будут перемещены все парты. 
-- `prefer_not_to_merge` — Отключает слияние кусков данных, хранящихся на данном томе. Если данная настройка включена, то слияние данных, хранящихся на данном томе, не допускается. Это позволяет контролировать работу ClickHouse с медленными дисками. Примеры конфигураций: @@ -718,7 +720,6 @@ TTL d + INTERVAL 1 MONTH GROUP BY k1, k2 SET x = max(x), y = min(y); external - true diff --git a/docs/ru/getting-started/example-datasets/criteo.md b/docs/ru/getting-started/example-datasets/criteo.md index 5ba55795632..4818e9e69d4 100644 --- a/docs/ru/getting-started/example-datasets/criteo.md +++ b/docs/ru/getting-started/example-datasets/criteo.md @@ -1,14 +1,14 @@ --- slug: /ru/getting-started/example-datasets/criteo sidebar_position: 18 -sidebar_label: "Терабайт логов кликов от Criteo" +sidebar_label: "Терабайтный журнал посещений сайта от Criteo" --- -# Терабайт логов кликов от Criteo {#terabait-logov-klikov-ot-criteo} +# Терабайтный журнал посещений сайта от Criteo {#terabaitnyi-zhurnal} Скачайте данные с http://labs.criteo.com/downloads/download-terabyte-click-logs/ -Создайте таблицу для импорта лога: +Создайте таблицу для импорта журнала: ``` sql CREATE TABLE criteo_log (date Date, clicked UInt8, int1 Int32, int2 Int32, int3 Int32, int4 Int32, int5 Int32, int6 Int32, int7 Int32, int8 Int32, int9 Int32, int10 Int32, int11 Int32, int12 Int32, int13 Int32, cat1 String, cat2 String, cat3 String, cat4 String, cat5 String, cat6 String, cat7 String, cat8 String, cat9 String, cat10 String, cat11 String, cat12 String, cat13 String, cat14 String, cat15 String, cat16 String, cat17 String, cat18 String, cat19 String, cat20 String, cat21 String, cat22 String, cat23 String, cat24 String, cat25 String, cat26 String) ENGINE = Log @@ -69,7 +69,7 @@ CREATE TABLE criteo ) ENGINE = MergeTree(date, intHash32(icat1), (date, intHash32(icat1)), 8192) ``` -Преобразуем данные из сырого лога и положим во вторую таблицу: +Преобразуйте импортированные данные, разложив их по таблице сконвертированных данных: ``` sql INSERT INTO criteo SELECT date, clicked, int1, int2, int3, int4, int5, int6, int7, int8, int9, int10, int11, int12, int13, reinterpretAsUInt32(unhex(cat1)) AS icat1, reinterpretAsUInt32(unhex(cat2)) AS icat2, reinterpretAsUInt32(unhex(cat3)) AS icat3, reinterpretAsUInt32(unhex(cat4)) AS icat4, reinterpretAsUInt32(unhex(cat5)) AS icat5, reinterpretAsUInt32(unhex(cat6)) AS icat6, reinterpretAsUInt32(unhex(cat7)) AS icat7, reinterpretAsUInt32(unhex(cat8)) AS icat8, reinterpretAsUInt32(unhex(cat9)) AS icat9, reinterpretAsUInt32(unhex(cat10)) AS icat10, reinterpretAsUInt32(unhex(cat11)) AS icat11, reinterpretAsUInt32(unhex(cat12)) AS icat12, reinterpretAsUInt32(unhex(cat13)) AS icat13, reinterpretAsUInt32(unhex(cat14)) AS icat14, reinterpretAsUInt32(unhex(cat15)) AS icat15, reinterpretAsUInt32(unhex(cat16)) AS icat16, reinterpretAsUInt32(unhex(cat17)) AS icat17, reinterpretAsUInt32(unhex(cat18)) AS icat18, reinterpretAsUInt32(unhex(cat19)) AS icat19, reinterpretAsUInt32(unhex(cat20)) AS icat20, reinterpretAsUInt32(unhex(cat21)) AS icat21, reinterpretAsUInt32(unhex(cat22)) AS icat22, reinterpretAsUInt32(unhex(cat23)) AS icat23, reinterpretAsUInt32(unhex(cat24)) AS icat24, reinterpretAsUInt32(unhex(cat25)) AS icat25, reinterpretAsUInt32(unhex(cat26)) AS icat26 FROM criteo_log; diff --git a/docs/ru/getting-started/example-datasets/github-events.mdx b/docs/ru/getting-started/example-datasets/github-events.mdx index c6e58a9f5a4..84f445074af 100644 --- a/docs/ru/getting-started/example-datasets/github-events.mdx +++ 
b/docs/ru/getting-started/example-datasets/github-events.mdx @@ -1,9 +1,9 @@ --- slug: /ru/getting-started/example-datasets/github-events sidebar_label: GitHub Events -title: "GitHub Events Dataset" +title: "Набор данных о событиях на GitHub" --- -import Content from '@site/docs/en/getting-started/example-datasets/github-events.md'; +Набор данных о событиях на GitHub с 2011 года по 6 декабря 2020 года содержит 3,1 млрд записей. Объём исходных данных — 75 ГБ, для загрузки в Clickhouse потребуется около 200 ГБ свободного пространства хранения (при использовании метода сжатия lz4). - +Полное описание набора, инструкции по загрузке и запросы к нему опубликованы на https://ghe.clickhouse.tech/ diff --git a/docs/ru/operations/settings/settings.md b/docs/ru/operations/settings/settings.md index e13ddd18030..2081dcc59b6 100644 --- a/docs/ru/operations/settings/settings.md +++ b/docs/ru/operations/settings/settings.md @@ -2249,7 +2249,7 @@ SELECT * FROM test_table ## input_format_parallel_parsing {#input-format-parallel-parsing} -Включает или отключает режим, при котором входящие данные разбиваются на части, парсинг каждой из которых осуществляется параллельно с сохранением исходного порядка. Поддерживается только для форматов [TSV](../../interfaces/formats.md#tabseparated), [TKSV](../../interfaces/formats.md#tskv), [CSV](../../interfaces/formats.md#csv) и [JSONEachRow](../../interfaces/formats.md#jsoneachrow). +Включает или отключает режим, при котором входящие данные разбиваются на части, парсинг каждой из которых осуществляется параллельно с сохранением исходного порядка. Поддерживается только для форматов [TSV](../../interfaces/formats.md#tabseparated), [TSKV](../../interfaces/formats.md#tskv), [CSV](../../interfaces/formats.md#csv) и [JSONEachRow](../../interfaces/formats.md#jsoneachrow). Возможные значения: @@ -2260,7 +2260,7 @@ SELECT * FROM test_table ## output_format_parallel_formatting {#output-format-parallel-formatting} -Включает или отключает режим, при котором исходящие данные форматируются параллельно с сохранением исходного порядка. Поддерживается только для форматов [TSV](../../interfaces/formats.md#tabseparated), [TKSV](../../interfaces/formats.md#tskv), [CSV](../../interfaces/formats.md#csv) и [JSONEachRow](../../interfaces/formats.md#jsoneachrow). +Включает или отключает режим, при котором исходящие данные форматируются параллельно с сохранением исходного порядка. Поддерживается только для форматов [TSV](../../interfaces/formats.md#tabseparated), [TSKV](../../interfaces/formats.md#tskv), [CSV](../../interfaces/formats.md#csv) и [JSONEachRow](../../interfaces/formats.md#jsoneachrow). Возможные значения: diff --git a/docs/ru/operations/system-tables/storage_policies.md b/docs/ru/operations/system-tables/storage_policies.md index 8c3f117ca91..dbb91a8ec1a 100644 --- a/docs/ru/operations/system-tables/storage_policies.md +++ b/docs/ru/operations/system-tables/storage_policies.md @@ -13,6 +13,5 @@ slug: /ru/operations/system-tables/storage_policies - `disks` ([Array(String)](../../sql-reference/data-types/array.md)) — имена дисков, содержащихся в политике хранения. - `max_data_part_size` ([UInt64](../../sql-reference/data-types/int-uint.md)) — максимальный размер куска данных, который может храниться на дисках тома (0 — без ограничений). - `move_factor` — доля доступного свободного места на томе, если места становится меньше, то данные начнут перемещение на следующий том, если он есть (по умолчанию 0.1). 
-- `prefer_not_to_merge` ([UInt8](../../sql-reference/data-types/int-uint.md)) — Значение настройки `prefer_not_to_merge`. Если данная настройка включена, то слияние данных, хранящихся на данном томе, не допускается. Это позволяет контролировать работу ClickHouse с медленными дисками. Если политика хранения содержит несколько томов, то каждому тому соответствует отдельная запись в таблице. diff --git a/docs/ru/operations/utilities/clickhouse-format.md b/docs/ru/operations/utilities/clickhouse-format.md index af66930b368..9c4b7304940 100644 --- a/docs/ru/operations/utilities/clickhouse-format.md +++ b/docs/ru/operations/utilities/clickhouse-format.md @@ -1,115 +1,115 @@ ---- +--- slug: /ru/operations/utilities/clickhouse-format -sidebar_position: 65 -sidebar_label: clickhouse-format ---- - -# clickhouse-format {#clickhouse-format} - -Позволяет форматировать входящие запросы. - -Ключи: - -- `--help` или`-h` — выводит описание ключей. -- `--query` — форматирует запрос любой длины и сложности. -- `--hilite` — добавляет подсветку синтаксиса с экранированием символов. -- `--oneline` — форматирование в одну строку. -- `--quiet` или `-q` — проверяет синтаксис без вывода результата. -- `--multiquery` or `-n` — поддерживает несколько запросов в одной строке. -- `--obfuscate` — обфусцирует вместо форматирования. -- `--seed <строка>` — задает строку, которая определяет результат обфускации. -- `--backslash` — добавляет обратный слеш в конце каждой строки отформатированного запроса. Удобно использовать если многострочный запрос скопирован из интернета или другого источника и его нужно выполнить из командной строки. - -## Примеры {#examples} - -1. Форматирование запроса: - -```bash -$ clickhouse-format --query "select number from numbers(10) where number%2 order by number desc;" -``` - -Результат: - -```text -SELECT number -FROM numbers(10) -WHERE number % 2 -ORDER BY number DESC -``` - -2. Подсветка синтаксиса и форматирование в одну строку: - -```bash -$ clickhouse-format --oneline --hilite <<< "SELECT sum(number) FROM numbers(5);" -``` - -Результат: - -```sql -SELECT sum(number) FROM numbers(5) -``` - -3. Несколько запросов в одной строке: - -```bash -$ clickhouse-format -n <<< "SELECT * FROM (SELECT 1 AS x UNION ALL SELECT 1 UNION DISTINCT SELECT 3);" -``` - -Результат: - -```text -SELECT * -FROM -( - SELECT 1 AS x - UNION ALL - SELECT 1 - UNION DISTINCT - SELECT 3 -) -; -``` - -4. Обфускация: - -```bash -$ clickhouse-format --seed Hello --obfuscate <<< "SELECT cost_first_screen BETWEEN a AND b, CASE WHEN x >= 123 THEN y ELSE NULL END;" -``` - -Результат: - -```text -SELECT treasury_mammoth_hazelnut BETWEEN nutmeg AND span, CASE WHEN chive >= 116 THEN switching ELSE ANYTHING END; -``` - -Тот же запрос с другой инициализацией обфускатора: - -```bash -$ clickhouse-format --seed World --obfuscate <<< "SELECT cost_first_screen BETWEEN a AND b, CASE WHEN x >= 123 THEN y ELSE NULL END;" -``` - -Результат: - -```text -SELECT horse_tape_summer BETWEEN folklore AND moccasins, CASE WHEN intestine >= 116 THEN nonconformist ELSE FORESTRY END; -``` - -5. Добавление обратного слеша: - -```bash -$ clickhouse-format --backslash <<< "SELECT * FROM (SELECT 1 AS x UNION ALL SELECT 1 UNION DISTINCT SELECT 3);" -``` - -Результат: - -```text -SELECT * \ -FROM \ -( \ - SELECT 1 AS x \ - UNION ALL \ - SELECT 1 \ - UNION DISTINCT \ - SELECT 3 \ -) -``` +sidebar_position: 65 +sidebar_label: clickhouse-format +--- + +# clickhouse-format {#clickhouse-format} + +Позволяет форматировать входящие запросы. 
+ +Ключи: + +- `--help` или`-h` — выводит описание ключей. +- `--query` — форматирует запрос любой длины и сложности. +- `--hilite` — добавляет подсветку синтаксиса с экранированием символов. +- `--oneline` — форматирование в одну строку. +- `--quiet` или `-q` — проверяет синтаксис без вывода результата. +- `--multiquery` or `-n` — поддерживает несколько запросов в одной строке. +- `--obfuscate` — обфусцирует вместо форматирования. +- `--seed <строка>` — задает строку, которая определяет результат обфускации. +- `--backslash` — добавляет обратный слеш в конце каждой строки отформатированного запроса. Удобно использовать если многострочный запрос скопирован из интернета или другого источника и его нужно выполнить из командной строки. + +## Примеры {#examples} + +1. Форматирование запроса: + +```bash +$ clickhouse-format --query "select number from numbers(10) where number%2 order by number desc;" +``` + +Результат: + +```text +SELECT number +FROM numbers(10) +WHERE number % 2 +ORDER BY number DESC +``` + +2. Подсветка синтаксиса и форматирование в одну строку: + +```bash +$ clickhouse-format --oneline --hilite <<< "SELECT sum(number) FROM numbers(5);" +``` + +Результат: + +```sql +SELECT sum(number) FROM numbers(5) +``` + +3. Несколько запросов в одной строке: + +```bash +$ clickhouse-format -n <<< "SELECT * FROM (SELECT 1 AS x UNION ALL SELECT 1 UNION DISTINCT SELECT 3);" +``` + +Результат: + +```text +SELECT * +FROM +( + SELECT 1 AS x + UNION ALL + SELECT 1 + UNION DISTINCT + SELECT 3 +) +; +``` + +4. Обфускация: + +```bash +$ clickhouse-format --seed Hello --obfuscate <<< "SELECT cost_first_screen BETWEEN a AND b, CASE WHEN x >= 123 THEN y ELSE NULL END;" +``` + +Результат: + +```text +SELECT treasury_mammoth_hazelnut BETWEEN nutmeg AND span, CASE WHEN chive >= 116 THEN switching ELSE ANYTHING END; +``` + +Тот же запрос с другой инициализацией обфускатора: + +```bash +$ clickhouse-format --seed World --obfuscate <<< "SELECT cost_first_screen BETWEEN a AND b, CASE WHEN x >= 123 THEN y ELSE NULL END;" +``` + +Результат: + +```text +SELECT horse_tape_summer BETWEEN folklore AND moccasins, CASE WHEN intestine >= 116 THEN nonconformist ELSE FORESTRY END; +``` + +5. Добавление обратного слеша: + +```bash +$ clickhouse-format --backslash <<< "SELECT * FROM (SELECT 1 AS x UNION ALL SELECT 1 UNION DISTINCT SELECT 3);" +``` + +Результат: + +```text +SELECT * \ +FROM \ +( \ + SELECT 1 AS x \ + UNION ALL \ + SELECT 1 \ + UNION DISTINCT \ + SELECT 3 \ +) +``` diff --git a/docs/ru/sql-reference/aggregate-functions/reference/sparkbar.md b/docs/ru/sql-reference/aggregate-functions/reference/sparkbar.md index 958a4bd3504..3b36ee04095 100644 --- a/docs/ru/sql-reference/aggregate-functions/reference/sparkbar.md +++ b/docs/ru/sql-reference/aggregate-functions/reference/sparkbar.md @@ -1,62 +1,62 @@ ---- -slug: /ru/sql-reference/aggregate-functions/reference/sparkbar -sidebar_position: 311 -sidebar_label: sparkbar ---- - -# sparkbar {#sparkbar} - -Функция строит гистограмму частот по заданным значениям `x` и частоте повторения этих значений `y` на интервале `[min_x, max_x]`. Повторения для всех `x`, попавших в один бакет, усредняются, поэтому данные должны быть предварительно агрегированы. Отрицательные повторения игнорируются. - -Если интервал для построения не указан, то в качестве нижней границы интервала будет взято минимальное значение `x`, а в качестве верхней границы — максимальное значение `x`. -Значения `x` вне указанного интервала игнорируются. 
- - -**Синтаксис** - -``` sql -sparkbar(width[, min_x, max_x])(x, y) -``` - -**Параметры** - -- `width` — Количество столбцов гистограммы. Тип: [Integer](../../../sql-reference/data-types/int-uint.md). - -- `min_x` — Начало интервала. Необязательный параметр. -- `max_x` — Конец интервала. Необязательный параметр. - -**Аргументы** - -- `x` — Поле со значениями. -- `y` — Поле с частотой повторения значений. - - -**Возвращаемые значения** - -- Гистограмма частот. - -**Пример** - -Запрос: - -``` sql -CREATE TABLE spark_bar_data (`value` Int64, `event_date` Date) ENGINE = MergeTree ORDER BY event_date; - -INSERT INTO spark_bar_data VALUES (1,'2020-01-01'), (3,'2020-01-02'), (4,'2020-01-02'), (-3,'2020-01-02'), (5,'2020-01-03'), (2,'2020-01-04'), (3,'2020-01-05'), (7,'2020-01-06'), (6,'2020-01-07'), (8,'2020-01-08'), (2,'2020-01-11'); - -SELECT sparkbar(9)(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); - -SELECT sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); -``` - -Результат: - -``` text -┌─sparkbar(9)(event_date, cnt)─┐ -│ ▂▅▂▃▆█ ▂ │ -└──────────────────────────────┘ - -┌─sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date, cnt)─┐ -│ ▂▅▂▃▇▆█ │ -└──────────────────────────────────────────────────────────────────────────┘ -``` +--- +slug: /ru/sql-reference/aggregate-functions/reference/sparkbar +sidebar_position: 311 +sidebar_label: sparkbar +--- + +# sparkbar {#sparkbar} + +Функция строит гистограмму частот по заданным значениям `x` и частоте повторения этих значений `y` на интервале `[min_x, max_x]`. Повторения для всех `x`, попавших в один бакет, усредняются, поэтому данные должны быть предварительно агрегированы. Отрицательные повторения игнорируются. + +Если интервал для построения не указан, то в качестве нижней границы интервала будет взято минимальное значение `x`, а в качестве верхней границы — максимальное значение `x`. +Значения `x` вне указанного интервала игнорируются. + + +**Синтаксис** + +``` sql +sparkbar(width[, min_x, max_x])(x, y) +``` + +**Параметры** + +- `width` — Количество столбцов гистограммы. Тип: [Integer](../../../sql-reference/data-types/int-uint.md). + +- `min_x` — Начало интервала. Необязательный параметр. +- `max_x` — Конец интервала. Необязательный параметр. + +**Аргументы** + +- `x` — Поле со значениями. +- `y` — Поле с частотой повторения значений. + + +**Возвращаемые значения** + +- Гистограмма частот. 
+ +**Пример** + +Запрос: + +``` sql +CREATE TABLE spark_bar_data (`value` Int64, `event_date` Date) ENGINE = MergeTree ORDER BY event_date; + +INSERT INTO spark_bar_data VALUES (1,'2020-01-01'), (3,'2020-01-02'), (4,'2020-01-02'), (-3,'2020-01-02'), (5,'2020-01-03'), (2,'2020-01-04'), (3,'2020-01-05'), (7,'2020-01-06'), (6,'2020-01-07'), (8,'2020-01-08'), (2,'2020-01-11'); + +SELECT sparkbar(9)(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); + +SELECT sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date,cnt) FROM (SELECT sum(value) as cnt, event_date FROM spark_bar_data GROUP BY event_date); +``` + +Результат: + +``` text +┌─sparkbar(9)(event_date, cnt)─┐ +│ ▂▅▂▃▆█ ▂ │ +└──────────────────────────────┘ + +┌─sparkbar(9, toDate('2020-01-01'), toDate('2020-01-10'))(event_date, cnt)─┐ +│ ▂▅▂▃▇▆█ │ +└──────────────────────────────────────────────────────────────────────────┘ +``` diff --git a/docs/ru/sql-reference/table-functions/file.md b/docs/ru/sql-reference/table-functions/file.md index 7c709619679..5331cf00728 100644 --- a/docs/ru/sql-reference/table-functions/file.md +++ b/docs/ru/sql-reference/table-functions/file.md @@ -76,14 +76,16 @@ SELECT * FROM file('test.csv', 'CSV', 'column1 UInt32, column2 UInt32, column3 U ## Шаблоны поиска в компонентах пути {#globs-in-path} -При описании пути к файлу могут использоваться шаблоны поиска. Обрабатываются только те файлы, у которых путь и название соответствуют шаблону полностью (а не только префикс или суффикс). +Путь к файлу может содержать шаблоны в режиме доступа только для чтения. +Шаблоны могут содержаться в разных частях пути. +Обрабатываться будут те и только те файлы, которые существуют в файловой системе и удовлетворяют всему шаблону пути. - `*` — заменяет любое количество любых символов кроме `/`, включая отсутствие символов. - `?` — заменяет ровно один любой символ. - `{some_string,another_string,yet_another_one}` — заменяет любую из строк `'some_string', 'another_string', 'yet_another_one'`. Эти строки также могут содержать символ `/`. - `{N..M}` — заменяет любое число в интервале от `N` до `M` включительно (может содержать ведущие нули). -Конструкция с `{}` аналогична табличной функции [remote](remote.md). +Конструкция с `{}` аналогична табличным функциям [remote](remote.md), [hdfs](hdfs.md). **Пример** diff --git a/docs/ru/sql-reference/table-functions/fileCluster.md b/docs/ru/sql-reference/table-functions/fileCluster.md index 7385f4859dc..2f2145b6dba 100644 --- a/docs/ru/sql-reference/table-functions/fileCluster.md +++ b/docs/ru/sql-reference/table-functions/fileCluster.md @@ -44,7 +44,7 @@ $ cat /var/lib/clickhouse/user_files/test1.csv 1,"file1" 11,"file11" -$ cat /var/lib/clickhouse/user_files/test1.csv +$ cat /var/lib/clickhouse/user_files/test2.csv 2,"file2" 22,"file22" ``` diff --git a/docs/ru/sql-reference/table-functions/hdfs.md b/docs/ru/sql-reference/table-functions/hdfs.md index b70de5e3a4f..6dcb1a21791 100644 --- a/docs/ru/sql-reference/table-functions/hdfs.md +++ b/docs/ru/sql-reference/table-functions/hdfs.md @@ -14,7 +14,7 @@ hdfs(URI, format, structure) **Входные параметры** -- `URI` — URI файла в HDFS. Путь к файлу поддерживает следующие шаблоны в режиме доступа только для чтения `*`, `?`, `{abc,def}` и `{N..M}`, где `N`, `M` — числа, \``'abc', 'def'` — строки. +- `URI` — URI файла в HDFS. - `format` — [формат](../../interfaces/formats.md#formats) файла. - `structure` — структура таблицы. 
Формат `'column1_name column1_type, column2_name column2_type, ...'`. @@ -41,19 +41,22 @@ LIMIT 2 ## Шаблоны поиска в компонентах пути {#globs-in-path} -- `*` — Заменяет любое количество любых символов кроме `/`, включая отсутствие символов. +Путь к файлу может содержать шаблоны в режиме доступа только для чтения. +Шаблоны могут содержаться в разных частях пути. +Обрабатываться будут те и только те файлы, которые существуют в файловой системе и удовлетворяют всему шаблону пути. + + +- `*` — Заменяет любое количество любых символов (кроме `/`), включая отсутствие символов. - `?` — Заменяет ровно один любой символ. - `{some_string,another_string,yet_another_one}` — Заменяет любую из строк `'some_string', 'another_string', 'yet_another_one'`. Эти строки также могут содержать символ `/`. - `{N..M}` — Заменяет любое число в интервале от `N` до `M` включительно (может содержать ведущие нули). -Конструкция с `{}` аналогична табличной функции [remote](remote.md). +Конструкция с `{}` аналогична табличной функции [remote](remote.md), [file](file.md). :::danger Предупреждение -Если ваш список файлов содержит интервал с ведущими нулями, используйте конструкцию с фигурными скобками для каждой цифры по отдельности или используйте `?`. +Если ваш список файлов содержит интервал с ведущими нулями, используйте отдельную конструкцию с фигурными скобками для каждой цифры или используйте `?`. ::: -Шаблоны могут содержаться в разных частях пути. Обрабатываться будут ровно те файлы, которые и удовлетворяют всему шаблону пути, и существуют в файловой системе. - ## Виртуальные столбцы {#virtualnye-stolbtsy} - `_path` — Путь к файлу. diff --git a/docs/ru/sql-reference/table-functions/s3.md b/docs/ru/sql-reference/table-functions/s3.md index 7deef68f47f..fe40cb0c507 100644 --- a/docs/ru/sql-reference/table-functions/s3.md +++ b/docs/ru/sql-reference/table-functions/s3.md @@ -11,7 +11,7 @@ sidebar_label: s3 **Синтаксис** ``` sql -s3(path [,aws_access_key_id, aws_secret_access_key] [,format] [,structure] [,compression]) +s3(path [,access_key_id, secret_access_key [,session_token]] [,format] [,structure] [,compression]) ``` **Aргументы** diff --git a/docs/ru/sql-reference/table-functions/s3Cluster.md b/docs/ru/sql-reference/table-functions/s3Cluster.md index b8f34d805ff..b382bf5e384 100644 --- a/docs/ru/sql-reference/table-functions/s3Cluster.md +++ b/docs/ru/sql-reference/table-functions/s3Cluster.md @@ -11,14 +11,14 @@ sidebar_label: s3Cluster **Синтаксис** ``` sql -s3Cluster(cluster_name, source, [,access_key_id, secret_access_key] [,format] [,structure]) +s3Cluster(cluster_name, source, [,access_key_id, secret_access_key [,session_token]] [,format] [,structure]) ``` **Аргументы** - `cluster_name` — имя кластера, используемое для создания набора адресов и параметров подключения к удаленным и локальным серверам. - `source` — URL файла или нескольких файлов. Поддерживает следующие символы подстановки: `*`, `?`, `{'abc','def'}` и `{N..M}`, где `N`, `M` — числа, `abc`, `def` — строки. Подробнее смотрите в разделе [Символы подстановки](../../engines/table-engines/integrations/s3.md#wildcards-in-path). -- `access_key_id` и `secret_access_key` — ключи, указывающие на учетные данные для использования с точкой приема запроса. Необязательные параметры. +- `access_key_id`, `secret_access_key` и `session_token` — ключи, указывающие на учетные данные для использования с точкой приема запроса. Необязательные параметры. - `format` — [формат](../../interfaces/formats.md#formats) файла. - `structure` — структура таблицы. 
Формат `'column1_name column1_type, column2_name column2_type, ...'`. diff --git a/docs/zh/development/style.md b/docs/zh/development/style.md index 977b4dce92a..c0a08291e02 100644 --- a/docs/zh/development/style.md +++ b/docs/zh/development/style.md @@ -485,7 +485,7 @@ catch (const DB::Exception & e) ``` cpp if (0 != close(fd)) - throwFromErrno("Cannot close file " + file_name, ErrorCodes::CANNOT_CLOSE_FILE); + throw ErrnoException(ErrorCodes::CANNOT_CLOSE_FILE, "Cannot close file {}", file_name); ``` `不要使用断言`。 diff --git a/docs/zh/engines/table-engines/mergetree-family/mergetree.md b/docs/zh/engines/table-engines/mergetree-family/mergetree.md index c738ae0f24c..bfa69338657 100644 --- a/docs/zh/engines/table-engines/mergetree-family/mergetree.md +++ b/docs/zh/engines/table-engines/mergetree-family/mergetree.md @@ -1,821 +1,822 @@ ---- -slug: /zh/engines/table-engines/mergetree-family/mergetree ---- -# MergeTree {#table_engines-mergetree} - -Clickhouse 中最强大的表引擎当属 `MergeTree` (合并树)引擎及该系列(`*MergeTree`)中的其他引擎。 - -`MergeTree` 系列的引擎被设计用于插入极大量的数据到一张表当中。数据可以以数据片段的形式一个接着一个的快速写入,数据片段在后台按照一定的规则进行合并。相比在插入时不断修改(重写)已存储的数据,这种策略会高效很多。 - -主要特点: - -- 存储的数据按主键排序。 - - 这使得您能够创建一个小型的稀疏索引来加快数据检索。 - -- 如果指定了 [分区键](custom-partitioning-key.md) 的话,可以使用分区。 - - 在相同数据集和相同结果集的情况下 ClickHouse 中某些带分区的操作会比普通操作更快。查询中指定了分区键时 ClickHouse 会自动截取分区数据。这也有效增加了查询性能。 - -- 支持数据副本。 - - `ReplicatedMergeTree` 系列的表提供了数据副本功能。更多信息,请参阅 [数据副本](replication.md) 一节。 - -- 支持数据采样。 - - 需要的话,您可以给表设置一个采样方法。 - -:::info -[合并](../special/merge.md#merge) 引擎并不属于 `*MergeTree` 系列。 -::: - -## 建表 {#table_engine-mergetree-creating-a-table} - -``` sql -CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] -( - name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1] [TTL expr1], - name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2] [TTL expr2], - ... - INDEX index_name1 expr1 TYPE type1(...) GRANULARITY value1, - INDEX index_name2 expr2 TYPE type2(...) GRANULARITY value2 -) ENGINE = MergeTree() -ORDER BY expr -[PARTITION BY expr] -[PRIMARY KEY expr] -[SAMPLE BY expr] -[TTL expr [DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'], ...] -[SETTINGS name=value, ...] -``` - -对于以上参数的描述,可参考 [CREATE 语句 的描述](../../../engines/table-engines/mergetree-family/mergetree.md) 。 - - - -**子句** - -- `ENGINE` - 引擎名和参数。 `ENGINE = MergeTree()`. `MergeTree` 引擎没有参数。 - -- `ORDER BY` — 排序键。 - - 可以是一组列的元组或任意的表达式。 例如: `ORDER BY (CounterID, EventDate)` 。 - - 如果没有使用 `PRIMARY KEY` 显式指定的主键,ClickHouse 会使用排序键作为主键。 - - 如果不需要排序,可以使用 `ORDER BY tuple()`. 
参考 [选择主键](https://clickhouse.com/docs/en/engines/table-engines/mergetree-family/mergetree/#selecting-the-primary-key) - -- `PARTITION BY` — [分区键](custom-partitioning-key.md) ,可选项。 - - 大多数情况下,不需要使用分区键。即使需要使用,也不需要使用比月更细粒度的分区键。分区不会加快查询(这与 ORDER BY 表达式不同)。永远也别使用过细粒度的分区键。不要使用客户端指定分区标识符或分区字段名称来对数据进行分区(而是将分区字段标识或名称作为 ORDER BY 表达式的第一列来指定分区)。 - - 要按月分区,可以使用表达式 `toYYYYMM(date_column)` ,这里的 `date_column` 是一个 [Date](../../../engines/table-engines/mergetree-family/mergetree.md) 类型的列。分区名的格式会是 `"YYYYMM"` 。 - -- `PRIMARY KEY` - 如果要 [选择与排序键不同的主键](#choosing-a-primary-key-that-differs-from-the-sorting-key),在这里指定,可选项。 - - 默认情况下主键跟排序键(由 `ORDER BY` 子句指定)相同。 - 因此,大部分情况下不需要再专门指定一个 `PRIMARY KEY` 子句。 - -- `SAMPLE BY` - 用于抽样的表达式,可选项。 - - 如果要用抽样表达式,主键中必须包含这个表达式。例如: - `SAMPLE BY intHash32(UserID) ORDER BY (CounterID, EventDate, intHash32(UserID))` 。 - -- `TTL` - 指定行存储的持续时间并定义数据片段在硬盘和卷上的移动逻辑的规则列表,可选项。 - - 表达式中必须存在至少一个 `Date` 或 `DateTime` 类型的列,比如: - - `TTL date + INTERVAl 1 DAY` - - 规则的类型 `DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'`指定了当满足条件(到达指定时间)时所要执行的动作:移除过期的行,还是将数据片段(如果数据片段中的所有行都满足表达式的话)移动到指定的磁盘(`TO DISK 'xxx'`) 或 卷(`TO VOLUME 'xxx'`)。默认的规则是移除(`DELETE`)。可以在列表中指定多个规则,但最多只能有一个`DELETE`的规则。 - - 更多细节,请查看 [表和列的 TTL](#table_engine-mergetree-ttl) - -- `SETTINGS` — 控制 `MergeTree` 行为的额外参数,可选项: - - - `index_granularity` — 索引粒度。索引中相邻的『标记』间的数据行数。默认值8192 。参考[数据存储](#mergetree-data-storage)。 - - `index_granularity_bytes` — 索引粒度,以字节为单位,默认值: 10Mb。如果想要仅按数据行数限制索引粒度, 请设置为0(不建议)。 - - `min_index_granularity_bytes` - 允许的最小数据粒度,默认值:1024b。该选项用于防止误操作,添加了一个非常低索引粒度的表。参考[数据存储](#mergetree-data-storage) - - `enable_mixed_granularity_parts` — 是否启用通过 `index_granularity_bytes` 控制索引粒度的大小。在19.11版本之前, 只有 `index_granularity` 配置能够用于限制索引粒度的大小。当从具有很大的行(几十上百兆字节)的表中查询数据时候,`index_granularity_bytes` 配置能够提升ClickHouse的性能。如果您的表里有很大的行,可以开启这项配置来提升`SELECT` 查询的性能。 - - `use_minimalistic_part_header_in_zookeeper` — ZooKeeper中数据片段存储方式 。如果`use_minimalistic_part_header_in_zookeeper=1` ,ZooKeeper 会存储更少的数据。更多信息参考[服务配置参数]([Server Settings | ClickHouse Documentation](https://clickhouse.com/docs/zh/operations/server-configuration-parameters/settings/))这章中的 [设置描述](../../../operations/server-configuration-parameters/settings.md#server-settings-use_minimalistic_part_header_in_zookeeper) 。 - - `min_merge_bytes_to_use_direct_io` — 使用直接 I/O 来操作磁盘的合并操作时要求的最小数据量。合并数据片段时,ClickHouse 会计算要被合并的所有数据的总存储空间。如果大小超过了 `min_merge_bytes_to_use_direct_io` 设置的字节数,则 ClickHouse 将使用直接 I/O 接口(`O_DIRECT` 选项)对磁盘读写。如果设置 `min_merge_bytes_to_use_direct_io = 0` ,则会禁用直接 I/O。默认值:`10 * 1024 * 1024 * 1024` 字节。 - - - `merge_with_ttl_timeout` — TTL合并频率的最小间隔时间,单位:秒。默认值: 86400 (1 天)。 - - `write_final_mark` — 是否启用在数据片段尾部写入最终索引标记。默认值: 1(不要关闭)。 - - `merge_max_block_size` — 在块中进行合并操作时的最大行数限制。默认值:8192 - - `storage_policy` — 存储策略。 参见 [使用具有多个块的设备进行数据存储](#table_engine-mergetree-multiple-volumes). 
- - `min_bytes_for_wide_part`,`min_rows_for_wide_part` 在数据片段中可以使用`Wide`格式进行存储的最小字节数/行数。您可以不设置、只设置一个,或全都设置。参考:[数据存储](#mergetree-data-storage) - - `max_parts_in_total` - 所有分区中最大块的数量(意义不明) - - `max_compress_block_size` - 在数据压缩写入表前,未压缩数据块的最大大小。您可以在全局设置中设置该值(参见[max_compress_block_size](https://clickhouse.com/docs/zh/operations/settings/settings/#max-compress-block-size))。建表时指定该值会覆盖全局设置。 - - `min_compress_block_size` - 在数据压缩写入表前,未压缩数据块的最小大小。您可以在全局设置中设置该值(参见[min_compress_block_size](https://clickhouse.com/docs/zh/operations/settings/settings/#min-compress-block-size))。建表时指定该值会覆盖全局设置。 - - `max_partitions_to_read` - 一次查询中可访问的分区最大数。您可以在全局设置中设置该值(参见[max_partitions_to_read](https://clickhouse.com/docs/zh/operations/settings/settings/#max_partitions_to_read))。 - -**示例配置** - -``` sql -ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity=8192 -``` - -在这个例子中,我们设置了按月进行分区。 - -同时我们设置了一个按用户 ID 哈希的抽样表达式。这使得您可以对该表中每个 `CounterID` 和 `EventDate` 的数据伪随机分布。如果您在查询时指定了 [SAMPLE](../../../engines/table-engines/mergetree-family/mergetree.md#select-sample-clause) 子句。 ClickHouse会返回对于用户子集的一个均匀的伪随机数据采样。 - -`index_granularity` 可省略因为 8192 是默认设置 。 - -
-已弃用的建表方法 - -:::attention "注意" -不要在新版项目中使用该方法,可能的话,请将旧项目切换到上述方法。 -::: - -``` sql -CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] -( - name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1], - name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2], - ... -) ENGINE [=] MergeTree(date-column [, sampling_expression], (primary, key), index_granularity) -``` - -**MergeTree() 参数** - -- `date-column` — 类型为 [日期](../../../engines/table-engines/mergetree-family/mergetree.md) 的列名。ClickHouse 会自动依据这个列按月创建分区。分区名格式为 `"YYYYMM"` 。 -- `sampling_expression` — 采样表达式。 -- `(primary, key)` — 主键。类型 — [元组()](../../../engines/table-engines/mergetree-family/mergetree.md) -- `index_granularity` — 索引粒度。即索引中相邻『标记』间的数据行数。设为 8192 可以适用大部分场景。 - -**示例** - - MergeTree(EventDate, intHash32(UserID), (CounterID, EventDate, intHash32(UserID)), 8192) - -对于主要的配置方法,这里 `MergeTree` 引擎跟前面的例子一样,可以以同样的方式配置。 -
- -## 数据存储 {#mergetree-data-storage} - -表由按主键排序的数据片段(DATA PART)组成。 - -当数据被插入到表中时,会创建多个数据片段并按主键的字典序排序。例如,主键是 `(CounterID, Date)` 时,片段中数据首先按 `CounterID` 排序,具有相同 `CounterID` 的部分按 `Date` 排序。 - -不同分区的数据会被分成不同的片段,ClickHouse 在后台合并数据片段以便更高效存储。不同分区的数据片段不会进行合并。合并机制并不保证具有相同主键的行全都合并到同一个数据片段中。 - -数据片段可以以 `Wide` 或 `Compact` 格式存储。在 `Wide` 格式下,每一列都会在文件系统中存储为单独的文件,在 `Compact` 格式下所有列都存储在一个文件中。`Compact` 格式可以提高插入量少插入频率频繁时的性能。 - -数据存储格式由 `min_bytes_for_wide_part` 和 `min_rows_for_wide_part` 表引擎参数控制。如果数据片段中的字节数或行数少于相应的设置值,数据片段会以 `Compact` 格式存储,否则会以 `Wide` 格式存储。 - -每个数据片段被逻辑的分割成颗粒(granules)。颗粒是 ClickHouse 中进行数据查询时的最小不可分割数据集。ClickHouse 不会对行或值进行拆分,所以每个颗粒总是包含整数个行。每个颗粒的第一行通过该行的主键值进行标记, -ClickHouse 会为每个数据片段创建一个索引文件来存储这些标记。对于每列,无论它是否包含在主键当中,ClickHouse 都会存储类似标记。这些标记让您可以在列文件中直接找到数据。 - -颗粒的大小通过表引擎参数 `index_granularity` 和 `index_granularity_bytes` 控制。颗粒的行数的在 `[1, index_granularity]` 范围中,这取决于行的大小。如果单行的大小超过了 `index_granularity_bytes` 设置的值,那么一个颗粒的大小会超过 `index_granularity_bytes`。在这种情况下,颗粒的大小等于该行的大小。 - -## 主键和索引在查询中的表现 {#primary-keys-and-indexes-in-queries} - -我们以 `(CounterID, Date)` 以主键。排序好的索引的图示会是下面这样: - -``` text - 全部数据 : [-------------------------------------------------------------------------] - CounterID: [aaaaaaaaaaaaaaaaaabbbbcdeeeeeeeeeeeeefgggggggghhhhhhhhhiiiiiiiiikllllllll] - Date: [1111111222222233331233211111222222333211111112122222223111112223311122333] - 标记: | | | | | | | | | | | - a,1 a,2 a,3 b,3 e,2 e,3 g,1 h,2 i,1 i,3 l,3 - 标记号: 0 1 2 3 4 5 6 7 8 9 10 -``` - -如果指定查询如下: - -- `CounterID in ('a', 'h')`,服务器会读取标记号在 `[0, 3)` 和 `[6, 8)` 区间中的数据。 -- `CounterID IN ('a', 'h') AND Date = 3`,服务器会读取标记号在 `[1, 3)` 和 `[7, 8)` 区间中的数据。 -- `Date = 3`,服务器会读取标记号在 `[1, 10]` 区间中的数据。 - -上面例子可以看出使用索引通常会比全表描述要高效。 - -稀疏索引会引起额外的数据读取。当读取主键单个区间范围的数据时,每个数据块中最多会多读 `index_granularity * 2` 行额外的数据。 - -稀疏索引使得您可以处理极大量的行,因为大多数情况下,这些索引常驻于内存。 - -ClickHouse 不要求主键唯一,所以您可以插入多条具有相同主键的行。 - -您可以在`PRIMARY KEY`与`ORDER BY`条件中使用`可为空的`类型的表达式,但强烈建议不要这么做。为了启用这项功能,请打开[allow_nullable_key](../../../operations/settings/index.md#allow-nullable-key),[NULLS_LAST](../../../sql-reference/statements/select/order-by.md#sorting-of-special-values)规则也适用于`ORDER BY`条件中有NULL值的情况下。 - -### 主键的选择 {#zhu-jian-de-xuan-ze} - -主键中列的数量并没有明确的限制。依据数据结构,您可以在主键包含多些或少些列。这样可以: - - - 改善索引的性能。 - - - 如果当前主键是 `(a, b)` ,在下列情况下添加另一个 `c` 列会提升性能: - - - 查询会使用 `c` 列作为条件 - - 很长的数据范围( `index_granularity` 的数倍)里 `(a, b)` 都是相同的值,并且这样的情况很普遍。换言之,就是加入另一列后,可以让您的查询略过很长的数据范围。 - - - 改善数据压缩。 - - ClickHouse 以主键排序片段数据,所以,数据的一致性越高,压缩越好。 - - - 在[CollapsingMergeTree](collapsingmergetree.md#table_engine-collapsingmergetree) 和 [SummingMergeTree](summingmergetree.md) 引擎里进行数据合并时会提供额外的处理逻辑。 - - 在这种情况下,指定与主键不同的 *排序键* 也是有意义的。 - -长的主键会对插入性能和内存消耗有负面影响,但主键中额外的列并不影响 `SELECT` 查询的性能。 - -可以使用 `ORDER BY tuple()` 语法创建没有主键的表。在这种情况下 ClickHouse 根据数据插入的顺序存储。如果在使用 `INSERT ... 
SELECT` 时希望保持数据的排序,请设置 [max_insert_threads = 1](../../../operations/settings/settings.md#settings-max-insert-threads)。 - -想要根据初始顺序进行数据查询,使用 [单线程查询](../../../operations/settings/settings.md#settings-max_threads) - -### 选择与排序键不同的主键 {#choosing-a-primary-key-that-differs-from-the-sorting-key} - -Clickhouse可以做到指定一个跟排序键不一样的主键,此时排序键用于在数据片段中进行排序,主键用于在索引文件中进行标记的写入。这种情况下,主键表达式元组必须是排序键表达式元组的前缀(即主键为(a,b),排序列必须为(a,b,******))。 - -当使用 [SummingMergeTree](summingmergetree.md) 和 [AggregatingMergeTree](aggregatingmergetree.md) 引擎时,这个特性非常有用。通常在使用这类引擎时,表里的列分两种:*维度* 和 *度量* 。典型的查询会通过任意的 `GROUP BY` 对度量列进行聚合并通过维度列进行过滤。由于 SummingMergeTree 和 AggregatingMergeTree 会对排序键相同的行进行聚合,所以把所有的维度放进排序键是很自然的做法。但这将导致排序键中包含大量的列,并且排序键会伴随着新添加的维度不断的更新。 - -在这种情况下合理的做法是,只保留少量的列在主键当中用于提升扫描效率,将维度列添加到排序键中。 - -对排序键进行 [ALTER](../../../sql-reference/statements/alter.md) 是轻量级的操作,因为当一个新列同时被加入到表里和排序键里时,已存在的数据片段并不需要修改。由于旧的排序键是新排序键的前缀,并且新添加的列中没有数据,因此在表修改时的数据对于新旧的排序键来说都是有序的。 - -### 索引和分区在查询中的应用 {#use-of-indexes-and-partitions-in-queries} - -对于 `SELECT` 查询,ClickHouse 分析是否可以使用索引。如果 `WHERE/PREWHERE` 子句具有下面这些表达式(作为完整WHERE条件的一部分或全部)则可以使用索引:进行相等/不相等的比较;对主键列或分区列进行`IN`运算、有固定前缀的`LIKE`运算(如name like 'test%')、函数运算(部分函数适用),还有对上述表达式进行逻辑运算。 - - -因此,在索引键的一个或多个区间上快速地执行查询是可能的。下面例子中,指定标签;指定标签和日期范围;指定标签和日期;指定多个标签和日期范围等执行查询,都会非常快。 - -当引擎配置如下时: - -``` sql - ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate) SETTINGS index_granularity=8192 -``` - -这种情况下,这些查询: - -``` sql -SELECT count() FROM table WHERE EventDate = toDate(now()) AND CounterID = 34 -SELECT count() FROM table WHERE EventDate = toDate(now()) AND (CounterID = 34 OR CounterID = 42) -SELECT count() FROM table WHERE ((EventDate >= toDate('2014-01-01') AND EventDate <= toDate('2014-01-31')) OR EventDate = toDate('2014-05-01')) AND CounterID IN (101500, 731962, 160656) AND (CounterID = 101500 OR EventDate != toDate('2014-05-01')) -``` - -ClickHouse 会依据主键索引剪掉不符合的数据,依据按月分区的分区键剪掉那些不包含符合数据的分区。 - -上文的查询显示,即使索引用于复杂表达式,因为读表操作经过优化,所以使用索引不会比完整扫描慢。 - -下面这个例子中,不会使用索引。 - -``` sql -SELECT count() FROM table WHERE CounterID = 34 OR URL LIKE '%upyachka%' -``` - -要检查 ClickHouse 执行一个查询时能否使用索引,可设置 [force_index_by_date](../../../operations/settings/settings.md#settings-force_index_by_date) 和 [force_primary_key](../../../operations/settings/settings.md) 。 - -使用按月分区的分区列允许只读取包含适当日期区间的数据块,这种情况下,数据块会包含很多天(最多整月)的数据。在块中,数据按主键排序,主键第一列可能不包含日期。因此,仅使用日期而没有用主键字段作为条件的查询将会导致需要读取超过这个指定日期以外的数据。 - -### 部分单调主键的使用 - -考虑这样的场景,比如一个月中的天数。它们在一个月的范围内形成一个[单调序列](https://zh.wikipedia.org/wiki/单调函数) ,但如果扩展到更大的时间范围它们就不再单调了。这就是一个部分单调序列。如果用户使用部分单调的主键创建表,ClickHouse同样会创建一个稀疏索引。当用户从这类表中查询数据时,ClickHouse 会对查询条件进行分析。如果用户希望获取两个索引标记之间的数据并且这两个标记在一个月以内,ClickHouse 可以在这种特殊情况下使用到索引,因为它可以计算出查询参数与索引标记之间的距离。 - -如果查询参数范围内的主键不是单调序列,那么 ClickHouse 无法使用索引。在这种情况下,ClickHouse 会进行全表扫描。 - -ClickHouse 在任何主键代表一个部分单调序列的情况下都会使用这个逻辑。 - -### 跳数索引 {#tiao-shu-suo-yin-fen-duan-hui-zong-suo-yin-shi-yan-xing-de} - -此索引在 `CREATE` 语句的列部分里定义。 - -``` sql -INDEX index_name expr TYPE type(...) GRANULARITY granularity_value -``` - -`*MergeTree` 系列的表可以指定跳数索引。 -跳数索引是指数据片段按照粒度(建表时指定的`index_granularity`)分割成小块后,将上述SQL的granularity_value数量的小块组合成一个大的块,对这些大块写入索引信息,这样有助于使用`where`筛选时跳过大量不必要的数据,减少`SELECT`需要读取的数据量。 - -**示例** - -``` sql -CREATE TABLE table_name -( - u64 UInt64, - i32 Int32, - s String, - ... - INDEX a (u64 * i32, s) TYPE minmax GRANULARITY 3, - INDEX b (u64 * length(s)) TYPE set(1000) GRANULARITY 4 -) ENGINE = MergeTree() -... 
-``` - -上例中的索引能让 ClickHouse 执行下面这些查询时减少读取数据量。 - -``` sql -SELECT count() FROM table WHERE s < 'z' -SELECT count() FROM table WHERE u64 * i32 == 10 AND u64 * length(s) >= 1234 -``` - -#### 可用的索引类型 {#table_engine-mergetree-data_skipping-indexes} - -- `minmax` - 存储指定表达式的极值(如果表达式是 `tuple` ,则存储 `tuple` 中每个元素的极值),这些信息用于跳过数据块,类似主键。 - -- `set(max_rows)` - 存储指定表达式的不重复值(不超过 `max_rows` 个,`max_rows=0` 则表示『无限制』)。这些信息可用于检查数据块是否满足 `WHERE` 条件。 - -- `ngrambf_v1(n, size_of_bloom_filter_in_bytes, number_of_hash_functions, random_seed)` - 存储一个包含数据块中所有 n元短语(ngram) 的 [布隆过滤器](https://en.wikipedia.org/wiki/Bloom_filter) 。只可用在字符串上。 - 可用于优化 `equals` , `like` 和 `in` 表达式的性能。 - - `n` – 短语长度。 - - `size_of_bloom_filter_in_bytes` – 布隆过滤器大小,字节为单位。(因为压缩得好,可以指定比较大的值,如 256 或 512)。 - - `number_of_hash_functions` – 布隆过滤器中使用的哈希函数的个数。 - - `random_seed` – 哈希函数的随机种子。 - -- `tokenbf_v1(size_of_bloom_filter_in_bytes, number_of_hash_functions, random_seed)` - 跟 `ngrambf_v1` 类似,但是存储的是token而不是ngrams。Token是由非字母数字的符号分割的序列。 - -- `bloom_filter(bloom_filter([false_positive])` – 为指定的列存储布隆过滤器 - - 可选参数`false_positive`用来指定从布隆过滤器收到错误响应的几率。取值范围是 (0,1),默认值:0.025 - - 支持的数据类型:`Int*`, `UInt*`, `Float*`, `Enum`, `Date`, `DateTime`, `String`, `FixedString`, `Array`, `LowCardinality`, `Nullable`。 - - 以下函数会用到这个索引: [equals](../../../sql-reference/functions/comparison-functions.md), [notEquals](../../../sql-reference/functions/comparison-functions.md), [in](../../../sql-reference/functions/in-functions.md), [notIn](../../../sql-reference/functions/in-functions.md), [has](../../../sql-reference/functions/array-functions.md) - -``` sql -INDEX sample_index (u64 * length(s)) TYPE minmax GRANULARITY 4 -INDEX sample_index2 (u64 * length(str), i32 + f64 * 100, date, str) TYPE set(100) GRANULARITY 4 -INDEX sample_index3 (lower(str), str) TYPE ngrambf_v1(3, 256, 2, 0) GRANULARITY 4 -``` - -#### 函数支持 {#functions-support} - -WHERE 子句中的条件可以包含对某列数据进行运算的函数表达式,如果列是索引的一部分,ClickHouse会在执行函数时尝试使用索引。不同的函数对索引的支持是不同的。 - -`set` 索引会对所有函数生效,其他索引对函数的生效情况见下表 - -| 函数 (操作符) / 索引 | primary key | minmax | ngrambf_v1 | tokenbf_v1 | bloom_filter | -| ------------------------------------------------------------ | ----------- | ------ | ---------- | ---------- | ------------ | -| [equals (=, ==)](../../../sql-reference/functions/comparison-functions.md#equals) | ✔ | ✔ | ✔ | ✔ | ✔ | -| [notEquals(!=, <>)](../../../sql-reference/functions/comparison-functions.md#notequals) | ✔ | ✔ | ✔ | ✔ | ✔ | -| [like](../../../sql-reference/functions/string-search-functions.md#function-like) | ✔ | ✔ | ✔ | ✔ | ✔ | -| [notLike](../../../sql-reference/functions/string-search-functions.md#function-notlike) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [startsWith](../../../sql-reference/functions/string-functions.md#startswith) | ✔ | ✔ | ✔ | ✔ | ✗ | -| [endsWith](../../../sql-reference/functions/string-functions.md#endswith) | ✗ | ✗ | ✔ | ✔ | ✗ | -| [multiSearchAny](../../../sql-reference/functions/string-search-functions.md#function-multisearchany) | ✗ | ✗ | ✔ | ✗ | ✗ | -| [in](../../../sql-reference/functions/in-functions.md#in-functions) | ✔ | ✔ | ✔ | ✔ | ✔ | -| [notIn](../../../sql-reference/functions/in-functions.md#in-functions) | ✔ | ✔ | ✔ | ✔ | ✔ | -| [less (\<)](../../../sql-reference/functions/comparison-functions.md#less) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [greater (\>)](../../../sql-reference/functions/comparison-functions.md#greater) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [lessOrEquals (\<=)](../../../sql-reference/functions/comparison-functions.md#lessorequals) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [greaterOrEquals 
(\>=)](../../../sql-reference/functions/comparison-functions.md#greaterorequals) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [empty](../../../sql-reference/functions/array-functions.md#function-empty) | ✔ | ✔ | ✗ | ✗ | ✗ | -| [notEmpty](../../../sql-reference/functions/array-functions.md#function-notempty) | ✔ | ✔ | ✗ | ✗ | ✗ | -| hasToken | ✗ | ✗ | ✗ | ✔ | ✗ | - -常量参数小于 ngram 大小的函数不能使用 `ngrambf_v1` 进行查询优化。 - -:::note -布隆过滤器可能会包含不符合条件的匹配,所以 `ngrambf_v1`, `tokenbf_v1` 和 `bloom_filter` 索引不能用于结果返回为假的函数,例如: - -- 可以用来优化的场景 - - `s LIKE '%test%'` - - `NOT s NOT LIKE '%test%'` - - `s = 1` - - `NOT s != 1` - - `startsWith(s, 'test')` -- 不能用来优化的场景 - - `NOT s LIKE '%test%'` - - `s NOT LIKE '%test%'` - - `NOT s = 1` - - `s != 1` - - `NOT startsWith(s, 'test')` -::: - -## 并发数据访问 {#concurrent-data-access} - -对于表的并发访问,我们使用多版本机制。换言之,当一张表同时被读和更新时,数据从当前查询到的一组片段中读取。没有冗长的的锁。插入不会阻碍读取。 - -对表的读操作是自动并行的。 - -## 列和表的 TTL {#table_engine-mergetree-ttl} - -TTL用于设置值的生命周期,它既可以为整张表设置,也可以为每个列字段单独设置。表级别的 TTL 还会指定数据在磁盘和卷上自动转移的逻辑。 - -TTL 表达式的计算结果必须是 [日期](../../../engines/table-engines/mergetree-family/mergetree.md) 或 [日期时间](../../../engines/table-engines/mergetree-family/mergetree.md) 类型的字段。 - -示例: - -``` sql -TTL time_column -TTL time_column + interval -``` - -要定义`interval`, 需要使用 [时间间隔](../../../engines/table-engines/mergetree-family/mergetree.md#operators-datetime) 操作符。 - -``` sql -TTL date_time + INTERVAL 1 MONTH -TTL date_time + INTERVAL 15 HOUR -``` - -### 列 TTL {#mergetree-column-ttl} - -当列中的值过期时, ClickHouse会将它们替换成该列数据类型的默认值。如果数据片段中列的所有值均已过期,则ClickHouse 会从文件系统中的数据片段中删除此列。 - -`TTL`子句不能被用于主键字段。 - -**示例:** - -创建表时指定 `TTL` - -``` sql -CREATE TABLE example_table -( - d DateTime, - a Int TTL d + INTERVAL 1 MONTH, - b Int TTL d + INTERVAL 1 MONTH, - c String -) -ENGINE = MergeTree -PARTITION BY toYYYYMM(d) -ORDER BY d; -``` - -为表中已存在的列字段添加 `TTL` - -``` sql -ALTER TABLE example_table - MODIFY COLUMN - c String TTL d + INTERVAL 1 DAY; -``` - -修改列字段的 `TTL` - -``` sql -ALTER TABLE example_table - MODIFY COLUMN - c String TTL d + INTERVAL 1 MONTH; -``` - -### 表 TTL {#mergetree-table-ttl} - -表可以设置一个用于移除过期行的表达式,以及多个用于在磁盘或卷上自动转移数据片段的表达式。当表中的行过期时,ClickHouse 会删除所有对应的行。对于数据片段的转移特性,必须所有的行都满足转移条件。 - -``` sql -TTL expr - [DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'][, DELETE|TO DISK 'aaa'|TO VOLUME 'bbb'] ... - [WHERE conditions] - [GROUP BY key_expr [SET v1 = aggr_func(v1) [, v2 = aggr_func(v2) ...]] ] - -``` - -TTL 规则的类型紧跟在每个 TTL 表达式后面,它会影响满足表达式时(到达指定时间时)应当执行的操作: - -- `DELETE` - 删除过期的行(默认操作); -- `TO DISK 'aaa'` - 将数据片段移动到磁盘 `aaa`; -- `TO VOLUME 'bbb'` - 将数据片段移动到卷 `bbb`. 
-- `GROUP BY` - 聚合过期的行 - -使用`WHERE`从句,您可以指定哪些过期的行会被删除或聚合(不适用于移动)。`GROUP BY`表达式必须是表主键的前缀。如果某列不是`GROUP BY`表达式的一部分,也没有在SET从句显示引用,结果行中相应列的值是随机的(就好像使用了`any`函数)。 - -**示例**: - -创建时指定 TTL - -``` sql -CREATE TABLE example_table -( - d DateTime, - a Int -) -ENGINE = MergeTree -PARTITION BY toYYYYMM(d) -ORDER BY d -TTL d + INTERVAL 1 MONTH DELETE, - d + INTERVAL 1 WEEK TO VOLUME 'aaa', - d + INTERVAL 2 WEEK TO DISK 'bbb'; -``` - -修改表的 `TTL` - -``` sql -ALTER TABLE example_table - MODIFY TTL d + INTERVAL 1 DAY; -``` - -创建一张表,设置一个月后数据过期,这些过期的行中日期为星期一的删除: - -``` sql -CREATE TABLE table_with_where -( - d DateTime, - a Int -) -ENGINE = MergeTree -PARTITION BY toYYYYMM(d) -ORDER BY d -TTL d + INTERVAL 1 MONTH DELETE WHERE toDayOfWeek(d) = 1; -``` - -创建一张表,设置过期的列会被聚合。列`x`包含每组行中的最大值,`y`为最小值,`d`为可能任意值。 - -``` sql -CREATE TABLE table_for_aggregation -( - d DateTime, - k1 Int, - k2 Int, - x Int, - y Int -) -ENGINE = MergeTree -ORDER BY (k1, k2) -TTL d + INTERVAL 1 MONTH GROUP BY k1, k2 SET x = max(x), y = min(y); -``` - -**删除数据** - -ClickHouse 在数据片段合并时会删除掉过期的数据。 - -当ClickHouse发现数据过期时, 它将会执行一个计划外的合并。要控制这类合并的频率, 您可以设置 `merge_with_ttl_timeout`。如果该值被设置的太低, 它将引发大量计划外的合并,这可能会消耗大量资源。 - -如果在两次合并的时间间隔中执行 `SELECT` 查询, 则可能会得到过期的数据。为了避免这种情况,可以在 `SELECT` 之前使用 [OPTIMIZE](../../../engines/table-engines/mergetree-family/mergetree.md#misc_operations-optimize) 。 - -## 使用多个块设备进行数据存储 {#table_engine-mergetree-multiple-volumes} - -### 介绍 {#introduction} - -MergeTree 系列表引擎可以将数据存储在多个块设备上。这对某些可以潜在被划分为“冷”“热”的表来说是很有用的。最新数据被定期的查询但只需要很小的空间。相反,详尽的历史数据很少被用到。如果有多块磁盘可用,那么“热”的数据可以放置在快速的磁盘上(比如 NVMe 固态硬盘或内存),“冷”的数据可以放在相对较慢的磁盘上(比如机械硬盘)。 - -数据片段是 `MergeTree` 引擎表的最小可移动单元。属于同一个数据片段的数据被存储在同一块磁盘上。数据片段会在后台自动的在磁盘间移动,也可以通过 [ALTER](../../../sql-reference/statements/alter.md#alter_move-partition) 查询来移动。 - -### 术语 {#terms} - -- 磁盘 — 挂载到文件系统的块设备 -- 默认磁盘 — 在服务器设置中通过 [path](../../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-path) 参数指定的数据存储 -- 卷 — 相同磁盘的顺序列表 (类似于 [JBOD](https://en.wikipedia.org/wiki/Non-RAID_drive_architectures)) -- 存储策略 — 卷的集合及他们之间的数据移动规则 - - 以上名称的信息在Clickhouse中系统表[system.storage_policies](https://clickhouse.com/docs/zh/operations/system-tables/storage_policies/#system_tables-storage_policies)和[system.disks](https://clickhouse.com/docs/zh/operations/system-tables/disks/#system_tables-disks)体现。为了应用存储策略,可以在建表时使用`storage_policy`设置。 - -### 配置 {#table_engine-mergetree-multiple-volumes_configure} - -磁盘、卷和存储策略应当在主配置文件 `config.xml` 或 `config.d` 目录中的独立文件中的 `` 标签内定义。 - -配置结构: - -``` xml - - - - /mnt/fast_ssd/clickhouse/ - - - /mnt/hdd1/clickhouse/ - 10485760 - - - /mnt/hdd2/clickhouse/ - 10485760 - - - ... - - - ... - -``` - -标签: - -- `` — 磁盘名,名称必须与其他磁盘不同. -- `path` — 服务器将用来存储数据 (`data` 和 `shadow` 目录) 的路径, 应当以 ‘/’ 结尾. -- `keep_free_space_bytes` — 需要保留的剩余磁盘空间. - -磁盘定义的顺序无关紧要。 - -存储策略配置: - -``` xml - - ... - - - - - disk_name_from_disks_configuration - 1073741824 - - - - - - - 0.2 - - - - - - - - ... - -``` - -标签: - -- `policy_name_N` — 策略名称,不能重复。 -- `volume_name_N` — 卷名称,不能重复。 -- `disk` — 卷中的磁盘。 -- `max_data_part_size_bytes` — 卷中的磁盘可以存储的数据片段的最大大小。 -- `move_factor` — 当可用空间少于这个因子时,数据将自动的向下一个卷(如果有的话)移动 (默认值为 0.1)。 -- `prefer_not_to_merge` - 禁止在这个卷中进行数据合并。该选项启用时,对该卷的数据不能进行合并。这个选项主要用于慢速磁盘。 - -配置示例: - -``` xml - - ... - - - - - disk1 - disk2 - - - - - - - - fast_ssd - 1073741824 - - - disk1 - - - 0.2 - - - - -
- jbod1 -
- - external - true - -
-
-
- ... -
-``` - -在给出的例子中, `hdd_in_order` 策略实现了 [循环制](https://zh.wikipedia.org/wiki/循环制) 方法。因此这个策略只定义了一个卷(`single`),数据片段会以循环的顺序全部存储到它的磁盘上。当有多个类似的磁盘挂载到系统上,但没有配置 RAID 时,这种策略非常有用。请注意一个每个独立的磁盘驱动都并不可靠,您可能需要用3份或更多的复制份数来补偿它。 - -如果在系统中有不同类型的磁盘可用,可以使用 `moving_from_ssd_to_hdd`。`hot` 卷由 SSD 磁盘(`fast_ssd`)组成,这个卷上可以存储的数据片段的最大大小为 1GB。所有大于 1GB 的数据片段都会被直接存储到 `cold` 卷上,`cold` 卷包含一个名为 `disk1` 的 HDD 磁盘。 -同样,一旦 `fast_ssd` 被填充超过 80%,数据会通过后台进程向 `disk1` 进行转移。 - -存储策略中卷的枚举顺序是很重要的。因为当一个卷被充满时,数据会向下一个卷转移。磁盘的枚举顺序同样重要,因为数据是依次存储在磁盘上的。 - -在创建表时,可以应用存储策略: - -``` sql -CREATE TABLE table_with_non_default_policy ( - EventDate Date, - OrderID UInt64, - BannerID UInt64, - SearchPhrase String -) ENGINE = MergeTree -ORDER BY (OrderID, BannerID) -PARTITION BY toYYYYMM(EventDate) -SETTINGS storage_policy = 'moving_from_ssd_to_hdd' -``` - -`default` 存储策略意味着只使用一个卷,这个卷只包含一个在 `` 中定义的磁盘。您可以使用[ALTER TABLE ... MODIFY SETTING]来修改存储策略,新的存储策略应该包含所有以前的磁盘和卷,并使用相同的名称。 - -可以通过 [background_move_pool_size](../../../operations/server-configuration-parameters/settings.md#background_move_pool_size) 设置调整执行后台任务的线程数。 - -### 详细说明 {#details} - -对于 `MergeTree` 表,数据通过以下不同的方式写入到磁盘当中: - -- 插入(`INSERT`查询) -- 后台合并和[数据变异](../../../sql-reference/statements/alter.md#alter-mutations) -- 从另一个副本下载 -- [ALTER TABLE … FREEZE PARTITION](../../../sql-reference/statements/alter.md#alter_freeze-partition) 冻结分区 - -除了数据变异和冻结分区以外的情况下,数据按照以下逻辑存储到卷或磁盘上: - -1. 首个卷(按定义顺序)拥有足够的磁盘空间存储数据片段(`unreserved_space > current_part_size`)并且允许存储给定数据片段的大小(`max_data_part_size_bytes > current_part_size`) -2. 在这个数据卷内,紧挨着先前存储数据的那块磁盘之后的磁盘,拥有比数据片段大的剩余空间。(`unreserved_space - keep_free_space_bytes > current_part_size`) - -更进一步,数据变异和分区冻结使用的是 [硬链接](https://en.wikipedia.org/wiki/Hard_link)。不同磁盘之间的硬链接是不支持的,所以在这种情况下数据片段都会被存储到原来的那一块磁盘上。 - -在后台,数据片段基于剩余空间(`move_factor`参数)根据卷在配置文件中定义的顺序进行转移。数据永远不会从最后一个移出也不会从第一个移入。可以通过系统表 [system.part_log](../../../operations/system-tables/part_log.md#system_tables-part-log) (字段 `type = MOVE_PART`) 和 [system.parts](../../../operations/system-tables/parts.md#system_tables-parts) (字段 `path` 和 `disk`) 来监控后台的移动情况。具体细节可以通过服务器日志查看。 - -用户可以通过 [ALTER TABLE … MOVE PART\|PARTITION … TO VOLUME\|DISK …](../../../sql-reference/statements/alter.md#alter_move-partition) 强制移动一个数据片段或分区到另外一个卷,所有后台移动的限制都会被考虑在内。这个查询会自行启动,无需等待后台操作完成。如果没有足够的可用空间或任何必须条件没有被满足,用户会收到报错信息。 - -数据移动不会妨碍到数据复制。也就是说,同一张表的不同副本可以指定不同的存储策略。 - -在后台合并和数据变异之后,旧的数据片段会在一定时间后被移除 (`old_parts_lifetime`)。在这期间,他们不能被移动到其他的卷或磁盘。也就是说,直到数据片段被完全移除,它们仍然会被磁盘占用空间计算在内。 - -## 使用S3进行数据存储 {#using-s3-data-storage} - -`MergeTree`系列表引擎允许使用[S3](https://aws.amazon.com/s3/)存储数据,需要修改磁盘类型为`S3`。 - -示例配置: - -``` xml - - ... - - - s3 - https://storage.yandexcloud.net/my-bucket/root-path/ - your_access_key_id - your_secret_access_key - - your_base64_encoded_customer_key - - http://proxy1 - http://proxy2 - - 10000 - 5000 - 10 - 4 - 1000 - /var/lib/clickhouse/disks/s3/ - false - - - ... 
- -``` - -必须的参数: - -- `endpoint` - S3的结点URL,以`path`或`virtual hosted`[格式](https://docs.aws.amazon.com/AmazonS3/latest/dev/VirtualHosting.html)书写。 -- `access_key_id` - S3的Access Key ID。 -- `secret_access_key` - S3的Secret Access Key。 - -可选参数: - -- `region` - S3的区域名称 -- `use_environment_credentials` - 从环境变量AWS_ACCESS_KEY_ID、AWS_SECRET_ACCESS_KEY和AWS_SESSION_TOKEN中读取认证参数。默认值为`false`。 -- `use_insecure_imds_request` - 如果设置为`true`,S3客户端在认证时会使用不安全的IMDS请求。默认值为`false`。 -- `proxy` - 访问S3结点URL时代理设置。每一个`uri`项的值都应该是合法的代理URL。 -- `connect_timeout_ms` - Socket连接超时时间,默认值为`10000`,即10秒。 -- `request_timeout_ms` - 请求超时时间,默认值为`5000`,即5秒。 -- `retry_attempts` - 请求失败后的重试次数,默认值为10。 -- `single_read_retries` - 读过程中连接丢失后重试次数,默认值为4。 -- `min_bytes_for_seek` - 使用查找操作,而不是顺序读操作的最小字节数,默认值为1000。 -- `metadata_path` - 本地存放S3元数据文件的路径,默认值为`/var/lib/clickhouse/disks//` -- `skip_access_check` - 如果为`true`,Clickhouse启动时不检查磁盘是否可用。默认为`false`。 -- `server_side_encryption_customer_key_base64` - 如果指定该项的值,请求时会加上为了访问SSE-C加密数据而必须的头信息。 - -S3磁盘也可以设置冷热存储: -```xml - - ... - - - s3 - https://storage.yandexcloud.net/my-bucket/root-path/ - your_access_key_id - your_secret_access_key - - - - - -
- s3 -
-
-
- - -
- default -
- - s3 - -
- 0.2 -
-
- ... -
-``` - -指定了`cold`选项后,本地磁盘剩余空间如果小于`move_factor * disk_size`,或有TTL设置时,数据就会定时迁移至S3了。 - -## 虚拟列 {#virtual-columns} - -- `_part` - 分区名称。 -- `_part_index` - 作为请求的结果,按顺序排列的分区数。 -- `_partition_id` — 分区名称。 -- `_part_uuid` - 唯一部分标识符(如果 MergeTree 设置`assign_part_uuids` 已启用)。 -- `_partition_value` — `partition by` 表达式的值(元组)。 -- `_sample_factor` - 采样因子(来自请求)。 +--- +slug: /zh/engines/table-engines/mergetree-family/mergetree +--- +# MergeTree {#table_engines-mergetree} + +Clickhouse 中最强大的表引擎当属 `MergeTree` (合并树)引擎及该系列(`*MergeTree`)中的其他引擎。 + +`MergeTree` 系列的引擎被设计用于插入极大量的数据到一张表当中。数据可以以数据片段的形式一个接着一个的快速写入,数据片段在后台按照一定的规则进行合并。相比在插入时不断修改(重写)已存储的数据,这种策略会高效很多。 + +主要特点: + +- 存储的数据按主键排序。 + + 这使得您能够创建一个小型的稀疏索引来加快数据检索。 + +- 如果指定了 [分区键](custom-partitioning-key.md) 的话,可以使用分区。 + + 在相同数据集和相同结果集的情况下 ClickHouse 中某些带分区的操作会比普通操作更快。查询中指定了分区键时 ClickHouse 会自动截取分区数据。这也有效增加了查询性能。 + +- 支持数据副本。 + + `ReplicatedMergeTree` 系列的表提供了数据副本功能。更多信息,请参阅 [数据副本](replication.md) 一节。 + +- 支持数据采样。 + + 需要的话,您可以给表设置一个采样方法。 + +:::info +[合并](../special/merge.md#merge) 引擎并不属于 `*MergeTree` 系列。 +::: + +## 建表 {#table_engine-mergetree-creating-a-table} + +``` sql +CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] +( + name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1] [TTL expr1], + name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2] [TTL expr2], + ... + INDEX index_name1 expr1 TYPE type1(...) GRANULARITY value1, + INDEX index_name2 expr2 TYPE type2(...) GRANULARITY value2 +) ENGINE = MergeTree() +ORDER BY expr +[PARTITION BY expr] +[PRIMARY KEY expr] +[SAMPLE BY expr] +[TTL expr [DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'], ...] +[SETTINGS name=value, ...] +``` + +对于以上参数的描述,可参考 [CREATE 语句 的描述](../../../engines/table-engines/mergetree-family/mergetree.md) 。 + + + +**子句** + +- `ENGINE` - 引擎名和参数。 `ENGINE = MergeTree()`. `MergeTree` 引擎没有参数。 + +- `ORDER BY` — 排序键。 + + 可以是一组列的元组或任意的表达式。 例如: `ORDER BY (CounterID, EventDate)` 。 + + 如果没有使用 `PRIMARY KEY` 显式指定的主键,ClickHouse 会使用排序键作为主键。 + + 如果不需要排序,可以使用 `ORDER BY tuple()`. 
参考 [选择主键](https://clickhouse.com/docs/en/engines/table-engines/mergetree-family/mergetree/#selecting-the-primary-key) + +- `PARTITION BY` — [分区键](custom-partitioning-key.md) ,可选项。 + + 大多数情况下,不需要使用分区键。即使需要使用,也不需要使用比月更细粒度的分区键。分区不会加快查询(这与 ORDER BY 表达式不同)。永远也别使用过细粒度的分区键。不要使用客户端指定分区标识符或分区字段名称来对数据进行分区(而是将分区字段标识或名称作为 ORDER BY 表达式的第一列来指定分区)。 + + 要按月分区,可以使用表达式 `toYYYYMM(date_column)` ,这里的 `date_column` 是一个 [Date](../../../engines/table-engines/mergetree-family/mergetree.md) 类型的列。分区名的格式会是 `"YYYYMM"` 。 + +- `PRIMARY KEY` - 如果要 [选择与排序键不同的主键](#choosing-a-primary-key-that-differs-from-the-sorting-key),在这里指定,可选项。 + + 默认情况下主键跟排序键(由 `ORDER BY` 子句指定)相同。 + 因此,大部分情况下不需要再专门指定一个 `PRIMARY KEY` 子句。 + +- `SAMPLE BY` - 用于抽样的表达式,可选项。 + + 如果要用抽样表达式,主键中必须包含这个表达式。例如: + `SAMPLE BY intHash32(UserID) ORDER BY (CounterID, EventDate, intHash32(UserID))` 。 + +- `TTL` - 指定行存储的持续时间并定义数据片段在硬盘和卷上的移动逻辑的规则列表,可选项。 + + 表达式中必须存在至少一个 `Date` 或 `DateTime` 类型的列,比如: + + `TTL date + INTERVAl 1 DAY` + + 规则的类型 `DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'`指定了当满足条件(到达指定时间)时所要执行的动作:移除过期的行,还是将数据片段(如果数据片段中的所有行都满足表达式的话)移动到指定的磁盘(`TO DISK 'xxx'`) 或 卷(`TO VOLUME 'xxx'`)。默认的规则是移除(`DELETE`)。可以在列表中指定多个规则,但最多只能有一个`DELETE`的规则。 + + 更多细节,请查看 [表和列的 TTL](#table_engine-mergetree-ttl) + +- `SETTINGS` — 控制 `MergeTree` 行为的额外参数,可选项: + + - `index_granularity` — 索引粒度。索引中相邻的『标记』间的数据行数。默认值8192 。参考[数据存储](#mergetree-data-storage)。 + - `index_granularity_bytes` — 索引粒度,以字节为单位,默认值: 10Mb。如果想要仅按数据行数限制索引粒度, 请设置为0(不建议)。 + - `min_index_granularity_bytes` - 允许的最小数据粒度,默认值:1024b。该选项用于防止误操作,添加了一个非常低索引粒度的表。参考[数据存储](#mergetree-data-storage) + - `enable_mixed_granularity_parts` — 是否启用通过 `index_granularity_bytes` 控制索引粒度的大小。在19.11版本之前, 只有 `index_granularity` 配置能够用于限制索引粒度的大小。当从具有很大的行(几十上百兆字节)的表中查询数据时候,`index_granularity_bytes` 配置能够提升ClickHouse的性能。如果您的表里有很大的行,可以开启这项配置来提升`SELECT` 查询的性能。 + - `use_minimalistic_part_header_in_zookeeper` — ZooKeeper中数据片段存储方式 。如果`use_minimalistic_part_header_in_zookeeper=1` ,ZooKeeper 会存储更少的数据。更多信息参考[服务配置参数]([Server Settings | ClickHouse Documentation](https://clickhouse.com/docs/zh/operations/server-configuration-parameters/settings/))这章中的 [设置描述](../../../operations/server-configuration-parameters/settings.md#server-settings-use_minimalistic_part_header_in_zookeeper) 。 + - `min_merge_bytes_to_use_direct_io` — 使用直接 I/O 来操作磁盘的合并操作时要求的最小数据量。合并数据片段时,ClickHouse 会计算要被合并的所有数据的总存储空间。如果大小超过了 `min_merge_bytes_to_use_direct_io` 设置的字节数,则 ClickHouse 将使用直接 I/O 接口(`O_DIRECT` 选项)对磁盘读写。如果设置 `min_merge_bytes_to_use_direct_io = 0` ,则会禁用直接 I/O。默认值:`10 * 1024 * 1024 * 1024` 字节。 + + - `merge_with_ttl_timeout` — TTL合并频率的最小间隔时间,单位:秒。默认值: 86400 (1 天)。 + - `write_final_mark` — 是否启用在数据片段尾部写入最终索引标记。默认值: 1(不要关闭)。 + - `merge_max_block_size` — 在块中进行合并操作时的最大行数限制。默认值:8192 + - `storage_policy` — 存储策略。 参见 [使用具有多个块的设备进行数据存储](#table_engine-mergetree-multiple-volumes). 
+ - `min_bytes_for_wide_part`,`min_rows_for_wide_part` 在数据片段中可以使用`Wide`格式进行存储的最小字节数/行数。您可以不设置、只设置一个,或全都设置。参考:[数据存储](#mergetree-data-storage) + - `max_parts_in_total` - 所有分区中最大块的数量(意义不明) + - `max_compress_block_size` - 在数据压缩写入表前,未压缩数据块的最大大小。您可以在全局设置中设置该值(参见[max_compress_block_size](https://clickhouse.com/docs/zh/operations/settings/settings/#max-compress-block-size))。建表时指定该值会覆盖全局设置。 + - `min_compress_block_size` - 在数据压缩写入表前,未压缩数据块的最小大小。您可以在全局设置中设置该值(参见[min_compress_block_size](https://clickhouse.com/docs/zh/operations/settings/settings/#min-compress-block-size))。建表时指定该值会覆盖全局设置。 + - `max_partitions_to_read` - 一次查询中可访问的分区最大数。您可以在全局设置中设置该值(参见[max_partitions_to_read](https://clickhouse.com/docs/zh/operations/settings/settings/#max_partitions_to_read))。 + +**示例配置** + +``` sql +ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate, intHash32(UserID)) SAMPLE BY intHash32(UserID) SETTINGS index_granularity=8192 +``` + +在这个例子中,我们设置了按月进行分区。 + +同时我们设置了一个按用户 ID 哈希的抽样表达式。这使得您可以对该表中每个 `CounterID` 和 `EventDate` 的数据伪随机分布。如果您在查询时指定了 [SAMPLE](../../../engines/table-engines/mergetree-family/mergetree.md#select-sample-clause) 子句。 ClickHouse会返回对于用户子集的一个均匀的伪随机数据采样。 + +`index_granularity` 可省略因为 8192 是默认设置 。 + +
+已弃用的建表方法 + +:::attention "注意" +不要在新版项目中使用该方法,可能的话,请将旧项目切换到上述方法。 +::: + +``` sql +CREATE TABLE [IF NOT EXISTS] [db.]table_name [ON CLUSTER cluster] +( + name1 [type1] [DEFAULT|MATERIALIZED|ALIAS expr1], + name2 [type2] [DEFAULT|MATERIALIZED|ALIAS expr2], + ... +) ENGINE [=] MergeTree(date-column [, sampling_expression], (primary, key), index_granularity) +``` + +**MergeTree() 参数** + +- `date-column` — 类型为 [日期](../../../engines/table-engines/mergetree-family/mergetree.md) 的列名。ClickHouse 会自动依据这个列按月创建分区。分区名格式为 `"YYYYMM"` 。 +- `sampling_expression` — 采样表达式。 +- `(primary, key)` — 主键。类型 — [元组()](../../../engines/table-engines/mergetree-family/mergetree.md) +- `index_granularity` — 索引粒度。即索引中相邻『标记』间的数据行数。设为 8192 可以适用大部分场景。 + +**示例** + + MergeTree(EventDate, intHash32(UserID), (CounterID, EventDate, intHash32(UserID)), 8192) + +对于主要的配置方法,这里 `MergeTree` 引擎跟前面的例子一样,可以以同样的方式配置。 +
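+
+下面给出一个示意性的改写草稿,帮助把已弃用的写法迁移到当前推荐的语法:表名与列类型(`UInt32` 等)仅为演示用的假设,参数沿用上文示例中的 `MergeTree(EventDate, intHash32(UserID), (CounterID, EventDate, intHash32(UserID)), 8192)`,并非权威实现。
+
+``` sql
+CREATE TABLE example_rewritten                        -- 表名为假设的演示名称
+(
+    EventDate Date,
+    CounterID UInt32,                                 -- 列类型仅为示意
+    UserID UInt32
+) ENGINE = MergeTree()
+PARTITION BY toYYYYMM(EventDate)                      -- 对应已弃用写法中的 date-column(按月分区)
+ORDER BY (CounterID, EventDate, intHash32(UserID))    -- 对应 (primary, key)
+SAMPLE BY intHash32(UserID)                           -- 对应 sampling_expression
+SETTINGS index_granularity = 8192;                    -- 对应 index_granularity
+```
+
+这组参数与上文 **示例配置** 中给出的写法一致,仅表达形式不同。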
+ +## 数据存储 {#mergetree-data-storage} + +表由按主键排序的数据片段(DATA PART)组成。 + +当数据被插入到表中时,会创建多个数据片段并按主键的字典序排序。例如,主键是 `(CounterID, Date)` 时,片段中数据首先按 `CounterID` 排序,具有相同 `CounterID` 的部分按 `Date` 排序。 + +不同分区的数据会被分成不同的片段,ClickHouse 在后台合并数据片段以便更高效存储。不同分区的数据片段不会进行合并。合并机制并不保证具有相同主键的行全都合并到同一个数据片段中。 + +数据片段可以以 `Wide` 或 `Compact` 格式存储。在 `Wide` 格式下,每一列都会在文件系统中存储为单独的文件,在 `Compact` 格式下所有列都存储在一个文件中。`Compact` 格式可以提高插入量少插入频率频繁时的性能。 + +数据存储格式由 `min_bytes_for_wide_part` 和 `min_rows_for_wide_part` 表引擎参数控制。如果数据片段中的字节数或行数少于相应的设置值,数据片段会以 `Compact` 格式存储,否则会以 `Wide` 格式存储。 + +每个数据片段被逻辑的分割成颗粒(granules)。颗粒是 ClickHouse 中进行数据查询时的最小不可分割数据集。ClickHouse 不会对行或值进行拆分,所以每个颗粒总是包含整数个行。每个颗粒的第一行通过该行的主键值进行标记, +ClickHouse 会为每个数据片段创建一个索引文件来存储这些标记。对于每列,无论它是否包含在主键当中,ClickHouse 都会存储类似标记。这些标记让您可以在列文件中直接找到数据。 + +颗粒的大小通过表引擎参数 `index_granularity` 和 `index_granularity_bytes` 控制。颗粒的行数的在 `[1, index_granularity]` 范围中,这取决于行的大小。如果单行的大小超过了 `index_granularity_bytes` 设置的值,那么一个颗粒的大小会超过 `index_granularity_bytes`。在这种情况下,颗粒的大小等于该行的大小。 + +## 主键和索引在查询中的表现 {#primary-keys-and-indexes-in-queries} + +我们以 `(CounterID, Date)` 以主键。排序好的索引的图示会是下面这样: + +``` text + 全部数据 : [-------------------------------------------------------------------------] + CounterID: [aaaaaaaaaaaaaaaaaabbbbcdeeeeeeeeeeeeefgggggggghhhhhhhhhiiiiiiiiikllllllll] + Date: [1111111222222233331233211111222222333211111112122222223111112223311122333] + 标记: | | | | | | | | | | | + a,1 a,2 a,3 b,3 e,2 e,3 g,1 h,2 i,1 i,3 l,3 + 标记号: 0 1 2 3 4 5 6 7 8 9 10 +``` + +如果指定查询如下: + +- `CounterID in ('a', 'h')`,服务器会读取标记号在 `[0, 3)` 和 `[6, 8)` 区间中的数据。 +- `CounterID IN ('a', 'h') AND Date = 3`,服务器会读取标记号在 `[1, 3)` 和 `[7, 8)` 区间中的数据。 +- `Date = 3`,服务器会读取标记号在 `[1, 10]` 区间中的数据。 + +上面例子可以看出使用索引通常会比全表描述要高效。 + +稀疏索引会引起额外的数据读取。当读取主键单个区间范围的数据时,每个数据块中最多会多读 `index_granularity * 2` 行额外的数据。 + +稀疏索引使得您可以处理极大量的行,因为大多数情况下,这些索引常驻于内存。 + +ClickHouse 不要求主键唯一,所以您可以插入多条具有相同主键的行。 + +您可以在`PRIMARY KEY`与`ORDER BY`条件中使用`可为空的`类型的表达式,但强烈建议不要这么做。为了启用这项功能,请打开[allow_nullable_key](../../../operations/settings/index.md#allow-nullable-key),[NULLS_LAST](../../../sql-reference/statements/select/order-by.md#sorting-of-special-values)规则也适用于`ORDER BY`条件中有NULL值的情况下。 + +### 主键的选择 {#zhu-jian-de-xuan-ze} + +主键中列的数量并没有明确的限制。依据数据结构,您可以在主键包含多些或少些列。这样可以: + + - 改善索引的性能。 + + - 如果当前主键是 `(a, b)` ,在下列情况下添加另一个 `c` 列会提升性能: + + - 查询会使用 `c` 列作为条件 + - 很长的数据范围( `index_granularity` 的数倍)里 `(a, b)` 都是相同的值,并且这样的情况很普遍。换言之,就是加入另一列后,可以让您的查询略过很长的数据范围。 + + - 改善数据压缩。 + + ClickHouse 以主键排序片段数据,所以,数据的一致性越高,压缩越好。 + + - 在[CollapsingMergeTree](collapsingmergetree.md#table_engine-collapsingmergetree) 和 [SummingMergeTree](summingmergetree.md) 引擎里进行数据合并时会提供额外的处理逻辑。 + + 在这种情况下,指定与主键不同的 *排序键* 也是有意义的。 + +长的主键会对插入性能和内存消耗有负面影响,但主键中额外的列并不影响 `SELECT` 查询的性能。 + +可以使用 `ORDER BY tuple()` 语法创建没有主键的表。在这种情况下 ClickHouse 根据数据插入的顺序存储。如果在使用 `INSERT ... 
SELECT` 时希望保持数据的排序,请设置 [max_insert_threads = 1](../../../operations/settings/settings.md#settings-max-insert-threads)。 + +想要根据初始顺序进行数据查询,使用 [单线程查询](../../../operations/settings/settings.md#settings-max_threads) + +### 选择与排序键不同的主键 {#choosing-a-primary-key-that-differs-from-the-sorting-key} + +Clickhouse可以做到指定一个跟排序键不一样的主键,此时排序键用于在数据片段中进行排序,主键用于在索引文件中进行标记的写入。这种情况下,主键表达式元组必须是排序键表达式元组的前缀(即主键为(a,b),排序列必须为(a,b,******))。 + +当使用 [SummingMergeTree](summingmergetree.md) 和 [AggregatingMergeTree](aggregatingmergetree.md) 引擎时,这个特性非常有用。通常在使用这类引擎时,表里的列分两种:*维度* 和 *度量* 。典型的查询会通过任意的 `GROUP BY` 对度量列进行聚合并通过维度列进行过滤。由于 SummingMergeTree 和 AggregatingMergeTree 会对排序键相同的行进行聚合,所以把所有的维度放进排序键是很自然的做法。但这将导致排序键中包含大量的列,并且排序键会伴随着新添加的维度不断的更新。 + +在这种情况下合理的做法是,只保留少量的列在主键当中用于提升扫描效率,将维度列添加到排序键中。 + +对排序键进行 [ALTER](../../../sql-reference/statements/alter.md) 是轻量级的操作,因为当一个新列同时被加入到表里和排序键里时,已存在的数据片段并不需要修改。由于旧的排序键是新排序键的前缀,并且新添加的列中没有数据,因此在表修改时的数据对于新旧的排序键来说都是有序的。 + +### 索引和分区在查询中的应用 {#use-of-indexes-and-partitions-in-queries} + +对于 `SELECT` 查询,ClickHouse 分析是否可以使用索引。如果 `WHERE/PREWHERE` 子句具有下面这些表达式(作为完整WHERE条件的一部分或全部)则可以使用索引:进行相等/不相等的比较;对主键列或分区列进行`IN`运算、有固定前缀的`LIKE`运算(如name like 'test%')、函数运算(部分函数适用),还有对上述表达式进行逻辑运算。 + + +因此,在索引键的一个或多个区间上快速地执行查询是可能的。下面例子中,指定标签;指定标签和日期范围;指定标签和日期;指定多个标签和日期范围等执行查询,都会非常快。 + +当引擎配置如下时: + +``` sql + ENGINE MergeTree() PARTITION BY toYYYYMM(EventDate) ORDER BY (CounterID, EventDate) SETTINGS index_granularity=8192 +``` + +这种情况下,这些查询: + +``` sql +SELECT count() FROM table WHERE EventDate = toDate(now()) AND CounterID = 34 +SELECT count() FROM table WHERE EventDate = toDate(now()) AND (CounterID = 34 OR CounterID = 42) +SELECT count() FROM table WHERE ((EventDate >= toDate('2014-01-01') AND EventDate <= toDate('2014-01-31')) OR EventDate = toDate('2014-05-01')) AND CounterID IN (101500, 731962, 160656) AND (CounterID = 101500 OR EventDate != toDate('2014-05-01')) +``` + +ClickHouse 会依据主键索引剪掉不符合的数据,依据按月分区的分区键剪掉那些不包含符合数据的分区。 + +上文的查询显示,即使索引用于复杂表达式,因为读表操作经过优化,所以使用索引不会比完整扫描慢。 + +下面这个例子中,不会使用索引。 + +``` sql +SELECT count() FROM table WHERE CounterID = 34 OR URL LIKE '%upyachka%' +``` + +要检查 ClickHouse 执行一个查询时能否使用索引,可设置 [force_index_by_date](../../../operations/settings/settings.md#settings-force_index_by_date) 和 [force_primary_key](../../../operations/settings/settings.md) 。 + +使用按月分区的分区列允许只读取包含适当日期区间的数据块,这种情况下,数据块会包含很多天(最多整月)的数据。在块中,数据按主键排序,主键第一列可能不包含日期。因此,仅使用日期而没有用主键字段作为条件的查询将会导致需要读取超过这个指定日期以外的数据。 + +### 部分单调主键的使用 + +考虑这样的场景,比如一个月中的天数。它们在一个月的范围内形成一个[单调序列](https://zh.wikipedia.org/wiki/单调函数) ,但如果扩展到更大的时间范围它们就不再单调了。这就是一个部分单调序列。如果用户使用部分单调的主键创建表,ClickHouse同样会创建一个稀疏索引。当用户从这类表中查询数据时,ClickHouse 会对查询条件进行分析。如果用户希望获取两个索引标记之间的数据并且这两个标记在一个月以内,ClickHouse 可以在这种特殊情况下使用到索引,因为它可以计算出查询参数与索引标记之间的距离。 + +如果查询参数范围内的主键不是单调序列,那么 ClickHouse 无法使用索引。在这种情况下,ClickHouse 会进行全表扫描。 + +ClickHouse 在任何主键代表一个部分单调序列的情况下都会使用这个逻辑。 + +### 跳数索引 {#tiao-shu-suo-yin-fen-duan-hui-zong-suo-yin-shi-yan-xing-de} + +此索引在 `CREATE` 语句的列部分里定义。 + +``` sql +INDEX index_name expr TYPE type(...) GRANULARITY granularity_value +``` + +`*MergeTree` 系列的表可以指定跳数索引。 +跳数索引是指数据片段按照粒度(建表时指定的`index_granularity`)分割成小块后,将上述SQL的granularity_value数量的小块组合成一个大的块,对这些大块写入索引信息,这样有助于使用`where`筛选时跳过大量不必要的数据,减少`SELECT`需要读取的数据量。 + +**示例** + +``` sql +CREATE TABLE table_name +( + u64 UInt64, + i32 Int32, + s String, + ... + INDEX a (u64 * i32, s) TYPE minmax GRANULARITY 3, + INDEX b (u64 * length(s)) TYPE set(1000) GRANULARITY 4 +) ENGINE = MergeTree() +... 
+``` + +上例中的索引能让 ClickHouse 执行下面这些查询时减少读取数据量。 + +``` sql +SELECT count() FROM table WHERE s < 'z' +SELECT count() FROM table WHERE u64 * i32 == 10 AND u64 * length(s) >= 1234 +``` + +#### 可用的索引类型 {#table_engine-mergetree-data_skipping-indexes} + +- `minmax` + 存储指定表达式的极值(如果表达式是 `tuple` ,则存储 `tuple` 中每个元素的极值),这些信息用于跳过数据块,类似主键。 + +- `set(max_rows)` + 存储指定表达式的不重复值(不超过 `max_rows` 个,`max_rows=0` 则表示『无限制』)。这些信息可用于检查数据块是否满足 `WHERE` 条件。 + +- `ngrambf_v1(n, size_of_bloom_filter_in_bytes, number_of_hash_functions, random_seed)` + 存储一个包含数据块中所有 n元短语(ngram) 的 [布隆过滤器](https://en.wikipedia.org/wiki/Bloom_filter) 。只可用在字符串上。 + 可用于优化 `equals` , `like` 和 `in` 表达式的性能。 + - `n` – 短语长度。 + - `size_of_bloom_filter_in_bytes` – 布隆过滤器大小,字节为单位。(因为压缩得好,可以指定比较大的值,如 256 或 512)。 + - `number_of_hash_functions` – 布隆过滤器中使用的哈希函数的个数。 + - `random_seed` – 哈希函数的随机种子。 + +- `tokenbf_v1(size_of_bloom_filter_in_bytes, number_of_hash_functions, random_seed)` + 跟 `ngrambf_v1` 类似,但是存储的是token而不是ngrams。Token是由非字母数字的符号分割的序列。 + +- `bloom_filter(bloom_filter([false_positive])` – 为指定的列存储布隆过滤器 + + 可选参数`false_positive`用来指定从布隆过滤器收到错误响应的几率。取值范围是 (0,1),默认值:0.025 + + 支持的数据类型:`Int*`, `UInt*`, `Float*`, `Enum`, `Date`, `DateTime`, `String`, `FixedString`, `Array`, `LowCardinality`, `Nullable`。 + + 以下函数会用到这个索引: [equals](../../../sql-reference/functions/comparison-functions.md), [notEquals](../../../sql-reference/functions/comparison-functions.md), [in](../../../sql-reference/functions/in-functions.md), [notIn](../../../sql-reference/functions/in-functions.md), [has](../../../sql-reference/functions/array-functions.md) + +``` sql +INDEX sample_index (u64 * length(s)) TYPE minmax GRANULARITY 4 +INDEX sample_index2 (u64 * length(str), i32 + f64 * 100, date, str) TYPE set(100) GRANULARITY 4 +INDEX sample_index3 (lower(str), str) TYPE ngrambf_v1(3, 256, 2, 0) GRANULARITY 4 +``` + +#### 函数支持 {#functions-support} + +WHERE 子句中的条件可以包含对某列数据进行运算的函数表达式,如果列是索引的一部分,ClickHouse会在执行函数时尝试使用索引。不同的函数对索引的支持是不同的。 + +`set` 索引会对所有函数生效,其他索引对函数的生效情况见下表 + +| 函数 (操作符) / 索引 | primary key | minmax | ngrambf_v1 | tokenbf_v1 | bloom_filter | +| ------------------------------------------------------------ | ----------- | ------ | ---------- | ---------- | ------------ | +| [equals (=, ==)](../../../sql-reference/functions/comparison-functions.md#equals) | ✔ | ✔ | ✔ | ✔ | ✔ | +| [notEquals(!=, <>)](../../../sql-reference/functions/comparison-functions.md#notequals) | ✔ | ✔ | ✔ | ✔ | ✔ | +| [like](../../../sql-reference/functions/string-search-functions.md#function-like) | ✔ | ✔ | ✔ | ✔ | ✔ | +| [notLike](../../../sql-reference/functions/string-search-functions.md#function-notlike) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [startsWith](../../../sql-reference/functions/string-functions.md#startswith) | ✔ | ✔ | ✔ | ✔ | ✗ | +| [endsWith](../../../sql-reference/functions/string-functions.md#endswith) | ✗ | ✗ | ✔ | ✔ | ✗ | +| [multiSearchAny](../../../sql-reference/functions/string-search-functions.md#function-multisearchany) | ✗ | ✗ | ✔ | ✗ | ✗ | +| [in](../../../sql-reference/functions/in-functions.md#in-functions) | ✔ | ✔ | ✔ | ✔ | ✔ | +| [notIn](../../../sql-reference/functions/in-functions.md#in-functions) | ✔ | ✔ | ✔ | ✔ | ✔ | +| [less (\<)](../../../sql-reference/functions/comparison-functions.md#less) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [greater (\>)](../../../sql-reference/functions/comparison-functions.md#greater) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [lessOrEquals (\<=)](../../../sql-reference/functions/comparison-functions.md#lessorequals) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [greaterOrEquals 
(\>=)](../../../sql-reference/functions/comparison-functions.md#greaterorequals) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [empty](../../../sql-reference/functions/array-functions.md#function-empty) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [notEmpty](../../../sql-reference/functions/array-functions.md#function-notempty) | ✔ | ✔ | ✗ | ✗ | ✗ | +| [has](../../../sql-reference/functions/array-functions.md#function-has) | ✗ | ✗ | ✔ | ✔ | ✔ | ✔ | +| [hasAny](../../../sql-reference/functions/array-functions.md#function-hasAny) | ✗ | ✗ | ✔ | ✔ | ✔ | ✗ | +| [hasAll](../../../sql-reference/functions/array-functions.md#function-hasAll) | ✗ | ✗ | ✗ | ✗ | ✔ | ✗ | +| hasToken | ✗ | ✗ | ✗ | ✔ | ✗ | + +常量参数小于 ngram 大小的函数不能使用 `ngrambf_v1` 进行查询优化。 + +:::note +布隆过滤器可能会包含不符合条件的匹配,所以 `ngrambf_v1`, `tokenbf_v1` 和 `bloom_filter` 索引不能用于结果返回为假的函数,例如: + +- 可以用来优化的场景 + - `s LIKE '%test%'` + - `NOT s NOT LIKE '%test%'` + - `s = 1` + - `NOT s != 1` + - `startsWith(s, 'test')` +- 不能用来优化的场景 + - `NOT s LIKE '%test%'` + - `s NOT LIKE '%test%'` + - `NOT s = 1` + - `s != 1` + - `NOT startsWith(s, 'test')` +::: + +## 并发数据访问 {#concurrent-data-access} + +对于表的并发访问,我们使用多版本机制。换言之,当一张表同时被读和更新时,数据从当前查询到的一组片段中读取。没有冗长的的锁。插入不会阻碍读取。 + +对表的读操作是自动并行的。 + +## 列和表的 TTL {#table_engine-mergetree-ttl} + +TTL用于设置值的生命周期,它既可以为整张表设置,也可以为每个列字段单独设置。表级别的 TTL 还会指定数据在磁盘和卷上自动转移的逻辑。 + +TTL 表达式的计算结果必须是 [日期](../../../engines/table-engines/mergetree-family/mergetree.md) 或 [日期时间](../../../engines/table-engines/mergetree-family/mergetree.md) 类型的字段。 + +示例: + +``` sql +TTL time_column +TTL time_column + interval +``` + +要定义`interval`, 需要使用 [时间间隔](../../../engines/table-engines/mergetree-family/mergetree.md#operators-datetime) 操作符。 + +``` sql +TTL date_time + INTERVAL 1 MONTH +TTL date_time + INTERVAL 15 HOUR +``` + +### 列 TTL {#mergetree-column-ttl} + +当列中的值过期时, ClickHouse会将它们替换成该列数据类型的默认值。如果数据片段中列的所有值均已过期,则ClickHouse 会从文件系统中的数据片段中删除此列。 + +`TTL`子句不能被用于主键字段。 + +**示例:** + +创建表时指定 `TTL` + +``` sql +CREATE TABLE example_table +( + d DateTime, + a Int TTL d + INTERVAL 1 MONTH, + b Int TTL d + INTERVAL 1 MONTH, + c String +) +ENGINE = MergeTree +PARTITION BY toYYYYMM(d) +ORDER BY d; +``` + +为表中已存在的列字段添加 `TTL` + +``` sql +ALTER TABLE example_table + MODIFY COLUMN + c String TTL d + INTERVAL 1 DAY; +``` + +修改列字段的 `TTL` + +``` sql +ALTER TABLE example_table + MODIFY COLUMN + c String TTL d + INTERVAL 1 MONTH; +``` + +### 表 TTL {#mergetree-table-ttl} + +表可以设置一个用于移除过期行的表达式,以及多个用于在磁盘或卷上自动转移数据片段的表达式。当表中的行过期时,ClickHouse 会删除所有对应的行。对于数据片段的转移特性,必须所有的行都满足转移条件。 + +``` sql +TTL expr + [DELETE|TO DISK 'xxx'|TO VOLUME 'xxx'][, DELETE|TO DISK 'aaa'|TO VOLUME 'bbb'] ... + [WHERE conditions] + [GROUP BY key_expr [SET v1 = aggr_func(v1) [, v2 = aggr_func(v2) ...]] ] + +``` + +TTL 规则的类型紧跟在每个 TTL 表达式后面,它会影响满足表达式时(到达指定时间时)应当执行的操作: + +- `DELETE` - 删除过期的行(默认操作); +- `TO DISK 'aaa'` - 将数据片段移动到磁盘 `aaa`; +- `TO VOLUME 'bbb'` - 将数据片段移动到卷 `bbb`. 
+- `GROUP BY` - 聚合过期的行 + +使用`WHERE`从句,您可以指定哪些过期的行会被删除或聚合(不适用于移动)。`GROUP BY`表达式必须是表主键的前缀。如果某列不是`GROUP BY`表达式的一部分,也没有在SET从句显示引用,结果行中相应列的值是随机的(就好像使用了`any`函数)。 + +**示例**: + +创建时指定 TTL + +``` sql +CREATE TABLE example_table +( + d DateTime, + a Int +) +ENGINE = MergeTree +PARTITION BY toYYYYMM(d) +ORDER BY d +TTL d + INTERVAL 1 MONTH DELETE, + d + INTERVAL 1 WEEK TO VOLUME 'aaa', + d + INTERVAL 2 WEEK TO DISK 'bbb'; +``` + +修改表的 `TTL` + +``` sql +ALTER TABLE example_table + MODIFY TTL d + INTERVAL 1 DAY; +``` + +创建一张表,设置一个月后数据过期,这些过期的行中日期为星期一的删除: + +``` sql +CREATE TABLE table_with_where +( + d DateTime, + a Int +) +ENGINE = MergeTree +PARTITION BY toYYYYMM(d) +ORDER BY d +TTL d + INTERVAL 1 MONTH DELETE WHERE toDayOfWeek(d) = 1; +``` + +创建一张表,设置过期的列会被聚合。列`x`包含每组行中的最大值,`y`为最小值,`d`为可能任意值。 + +``` sql +CREATE TABLE table_for_aggregation +( + d DateTime, + k1 Int, + k2 Int, + x Int, + y Int +) +ENGINE = MergeTree +ORDER BY (k1, k2) +TTL d + INTERVAL 1 MONTH GROUP BY k1, k2 SET x = max(x), y = min(y); +``` + +**删除数据** + +ClickHouse 在数据片段合并时会删除掉过期的数据。 + +当ClickHouse发现数据过期时, 它将会执行一个计划外的合并。要控制这类合并的频率, 您可以设置 `merge_with_ttl_timeout`。如果该值被设置的太低, 它将引发大量计划外的合并,这可能会消耗大量资源。 + +如果在两次合并的时间间隔中执行 `SELECT` 查询, 则可能会得到过期的数据。为了避免这种情况,可以在 `SELECT` 之前使用 [OPTIMIZE](../../../engines/table-engines/mergetree-family/mergetree.md#misc_operations-optimize) 。 + +## 使用多个块设备进行数据存储 {#table_engine-mergetree-multiple-volumes} + +### 介绍 {#introduction} + +MergeTree 系列表引擎可以将数据存储在多个块设备上。这对某些可以潜在被划分为“冷”“热”的表来说是很有用的。最新数据被定期的查询但只需要很小的空间。相反,详尽的历史数据很少被用到。如果有多块磁盘可用,那么“热”的数据可以放置在快速的磁盘上(比如 NVMe 固态硬盘或内存),“冷”的数据可以放在相对较慢的磁盘上(比如机械硬盘)。 + +数据片段是 `MergeTree` 引擎表的最小可移动单元。属于同一个数据片段的数据被存储在同一块磁盘上。数据片段会在后台自动的在磁盘间移动,也可以通过 [ALTER](../../../sql-reference/statements/alter.md#alter_move-partition) 查询来移动。 + +### 术语 {#terms} + +- 磁盘 — 挂载到文件系统的块设备 +- 默认磁盘 — 在服务器设置中通过 [path](../../../operations/server-configuration-parameters/settings.md#server_configuration_parameters-path) 参数指定的数据存储 +- 卷 — 相同磁盘的顺序列表 (类似于 [JBOD](https://en.wikipedia.org/wiki/Non-RAID_drive_architectures)) +- 存储策略 — 卷的集合及他们之间的数据移动规则 + + 以上名称的信息在Clickhouse中系统表[system.storage_policies](https://clickhouse.com/docs/zh/operations/system-tables/storage_policies/#system_tables-storage_policies)和[system.disks](https://clickhouse.com/docs/zh/operations/system-tables/disks/#system_tables-disks)体现。为了应用存储策略,可以在建表时使用`storage_policy`设置。 + +### 配置 {#table_engine-mergetree-multiple-volumes_configure} + +磁盘、卷和存储策略应当在主配置文件 `config.xml` 或 `config.d` 目录中的独立文件中的 `` 标签内定义。 + +配置结构: + +``` xml + + + + /mnt/fast_ssd/clickhouse/ + + + /mnt/hdd1/clickhouse/ + 10485760 + + + /mnt/hdd2/clickhouse/ + 10485760 + + + ... + + + ... + +``` + +标签: + +- `` — 磁盘名,名称必须与其他磁盘不同. +- `path` — 服务器将用来存储数据 (`data` 和 `shadow` 目录) 的路径, 应当以 ‘/’ 结尾. +- `keep_free_space_bytes` — 需要保留的剩余磁盘空间. + +磁盘定义的顺序无关紧要。 + +存储策略配置: + +``` xml + + ... + + + + + disk_name_from_disks_configuration + 1073741824 + + + + + + + 0.2 + + + + + + + + ... + +``` + +标签: + +- `policy_name_N` — 策略名称,不能重复。 +- `volume_name_N` — 卷名称,不能重复。 +- `disk` — 卷中的磁盘。 +- `max_data_part_size_bytes` — 卷中的磁盘可以存储的数据片段的最大大小。 +- `move_factor` — 当可用空间少于这个因子时,数据将自动的向下一个卷(如果有的话)移动 (默认值为 0.1)。 + +配置示例: + +``` xml + + ... + + + + + disk1 + disk2 + + + + + + + + fast_ssd + 1073741824 + + + disk1 + + + 0.2 + + + + +
+ jbod1 +
+ + external + +
+
+
+ ... +
+``` + +在给出的例子中, `hdd_in_order` 策略实现了 [循环制](https://zh.wikipedia.org/wiki/循环制) 方法。因此这个策略只定义了一个卷(`single`),数据片段会以循环的顺序全部存储到它的磁盘上。当有多个类似的磁盘挂载到系统上,但没有配置 RAID 时,这种策略非常有用。请注意一个每个独立的磁盘驱动都并不可靠,您可能需要用3份或更多的复制份数来补偿它。 + +如果在系统中有不同类型的磁盘可用,可以使用 `moving_from_ssd_to_hdd`。`hot` 卷由 SSD 磁盘(`fast_ssd`)组成,这个卷上可以存储的数据片段的最大大小为 1GB。所有大于 1GB 的数据片段都会被直接存储到 `cold` 卷上,`cold` 卷包含一个名为 `disk1` 的 HDD 磁盘。 +同样,一旦 `fast_ssd` 被填充超过 80%,数据会通过后台进程向 `disk1` 进行转移。 + +存储策略中卷的枚举顺序是很重要的。因为当一个卷被充满时,数据会向下一个卷转移。磁盘的枚举顺序同样重要,因为数据是依次存储在磁盘上的。 + +在创建表时,可以应用存储策略: + +``` sql +CREATE TABLE table_with_non_default_policy ( + EventDate Date, + OrderID UInt64, + BannerID UInt64, + SearchPhrase String +) ENGINE = MergeTree +ORDER BY (OrderID, BannerID) +PARTITION BY toYYYYMM(EventDate) +SETTINGS storage_policy = 'moving_from_ssd_to_hdd' +``` + +`default` 存储策略意味着只使用一个卷,这个卷只包含一个在 `` 中定义的磁盘。您可以使用[ALTER TABLE ... MODIFY SETTING]来修改存储策略,新的存储策略应该包含所有以前的磁盘和卷,并使用相同的名称。 + +可以通过 [background_move_pool_size](../../../operations/server-configuration-parameters/settings.md#background_move_pool_size) 设置调整执行后台任务的线程数。 + +### 详细说明 {#details} + +对于 `MergeTree` 表,数据通过以下不同的方式写入到磁盘当中: + +- 插入(`INSERT`查询) +- 后台合并和[数据变异](../../../sql-reference/statements/alter.md#alter-mutations) +- 从另一个副本下载 +- [ALTER TABLE … FREEZE PARTITION](../../../sql-reference/statements/alter.md#alter_freeze-partition) 冻结分区 + +除了数据变异和冻结分区以外的情况下,数据按照以下逻辑存储到卷或磁盘上: + +1. 首个卷(按定义顺序)拥有足够的磁盘空间存储数据片段(`unreserved_space > current_part_size`)并且允许存储给定数据片段的大小(`max_data_part_size_bytes > current_part_size`) +2. 在这个数据卷内,紧挨着先前存储数据的那块磁盘之后的磁盘,拥有比数据片段大的剩余空间。(`unreserved_space - keep_free_space_bytes > current_part_size`) + +更进一步,数据变异和分区冻结使用的是 [硬链接](https://en.wikipedia.org/wiki/Hard_link)。不同磁盘之间的硬链接是不支持的,所以在这种情况下数据片段都会被存储到原来的那一块磁盘上。 + +在后台,数据片段基于剩余空间(`move_factor`参数)根据卷在配置文件中定义的顺序进行转移。数据永远不会从最后一个移出也不会从第一个移入。可以通过系统表 [system.part_log](../../../operations/system-tables/part_log.md#system_tables-part-log) (字段 `type = MOVE_PART`) 和 [system.parts](../../../operations/system-tables/parts.md#system_tables-parts) (字段 `path` 和 `disk`) 来监控后台的移动情况。具体细节可以通过服务器日志查看。 + +用户可以通过 [ALTER TABLE … MOVE PART\|PARTITION … TO VOLUME\|DISK …](../../../sql-reference/statements/alter.md#alter_move-partition) 强制移动一个数据片段或分区到另外一个卷,所有后台移动的限制都会被考虑在内。这个查询会自行启动,无需等待后台操作完成。如果没有足够的可用空间或任何必须条件没有被满足,用户会收到报错信息。 + +数据移动不会妨碍到数据复制。也就是说,同一张表的不同副本可以指定不同的存储策略。 + +在后台合并和数据变异之后,旧的数据片段会在一定时间后被移除 (`old_parts_lifetime`)。在这期间,他们不能被移动到其他的卷或磁盘。也就是说,直到数据片段被完全移除,它们仍然会被磁盘占用空间计算在内。 + +## 使用S3进行数据存储 {#using-s3-data-storage} + +`MergeTree`系列表引擎允许使用[S3](https://aws.amazon.com/s3/)存储数据,需要修改磁盘类型为`S3`。 + +示例配置: + +``` xml + + ... + + + s3 + https://storage.yandexcloud.net/my-bucket/root-path/ + your_access_key_id + your_secret_access_key + + your_base64_encoded_customer_key + + http://proxy1 + http://proxy2 + + 10000 + 5000 + 10 + 4 + 1000 + /var/lib/clickhouse/disks/s3/ + false + + + ... 
+
+Required parameters:
+
+- `endpoint` - S3 endpoint URL, in either `path` or `virtual hosted` [style](https://docs.aws.amazon.com/AmazonS3/latest/dev/VirtualHosting.html).
+- `access_key_id` - S3 access key id.
+- `secret_access_key` - S3 secret access key.
+
+Optional parameters:
+
+- `region` - S3 region name.
+- `use_environment_credentials` - Read credentials from the environment variables AWS_ACCESS_KEY_ID, AWS_SECRET_ACCESS_KEY and AWS_SESSION_TOKEN. Default value is `false`.
+- `use_insecure_imds_request` - If set to `true`, the S3 client uses an insecure IMDS request while obtaining credentials. Default value is `false`.
+- `proxy` - Proxy configuration for access to the S3 endpoint. Each `uri` value must be a valid proxy URL.
+- `connect_timeout_ms` - Socket connect timeout in milliseconds. Default value is `10000` (10 seconds).
+- `request_timeout_ms` - Request timeout in milliseconds. Default value is `5000` (5 seconds).
+- `retry_attempts` - Number of retry attempts for a failed request. Default value is `10`.
+- `single_read_retries` - Number of retry attempts when the connection is dropped during a read. Default value is `4`.
+- `min_bytes_for_seek` - Minimal number of bytes to use a seek operation instead of a sequential read. Default value is `1000`.
+- `metadata_path` - Path on the local filesystem where metadata files for S3 are stored. Default value is `/var/lib/clickhouse/disks/<disk_name>/`.
+- `skip_access_check` - If `true`, ClickHouse does not check whether the disk is accessible at startup. Default value is `false`.
+- `server_side_encryption_customer_key_base64` - If specified, the headers required to access SSE-C encrypted data in S3 are added to requests.
+
+An S3 disk can also be used in a hot/cold storage setup:
+```xml
+<storage_configuration>
+    ...
+    <disks>
+        <s3>
+            <type>s3</type>
+            <endpoint>https://storage.yandexcloud.net/my-bucket/root-path/</endpoint>
+            <access_key_id>your_access_key_id</access_key_id>
+            <secret_access_key>your_secret_access_key</secret_access_key>
+        </s3>
+    </disks>
+    <policies>
+        <s3_main>
+            <volumes>
+                <main>
+                    <disk>s3</disk>
+                </main>
+            </volumes>
+        </s3_main>
+        <s3_cold>
+            <volumes>
+                <main>
+                    <disk>default</disk>
+                </main>
+                <external>
+                    <disk>s3</disk>
+                </external>
+            </volumes>
+            <move_factor>0.2</move_factor>
+        </s3_cold>
+    </policies>
+    ...
+</storage_configuration>
+```
+
+With the `cold` option, data is moved to S3 when the free space on the local disk drops below `move_factor * disk_size`, or when a TTL move rule applies.
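+
+For illustration only, a table can then be attached to one of these policies. This is a minimal sketch; the policy name `s3_cold` is taken from the example configuration above and must match whatever policy your server actually defines:
+
+``` sql
+-- Hypothetical table that stores its parts according to the S3-backed `s3_cold` policy.
+CREATE TABLE s3_cold_table
+(
+    EventDate Date,
+    Value UInt64
+)
+ENGINE = MergeTree
+ORDER BY (EventDate, Value)
+PARTITION BY toYYYYMM(EventDate)
+SETTINGS storage_policy = 's3_cold';
+```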
+
+## Virtual Columns {#virtual-columns}
+
+- `_part` - Name of the data part.
+- `_part_index` - Sequential index of the data part in the query result.
+- `_partition_id` - Name of the partition.
+- `_part_uuid` - Unique part identifier (if the MergeTree setting `assign_part_uuids` is enabled).
+- `_partition_value` - Values (a tuple) of the `partition by` expression.
+- `_sample_factor` - Sample factor (from the query).
diff --git a/docs/zh/faq/general/dbms-naming.md b/docs/zh/faq/general/dbms-naming.md
index e732c2f054e..f24b3134093 100644
--- a/docs/zh/faq/general/dbms-naming.md
+++ b/docs/zh/faq/general/dbms-naming.md
@@ -1,18 +1,18 @@
----
+---
 slug: /zh/faq/general/dbms-naming
-title: "\u201CClickHouse\u201D 有什么含义?"
-toc_hidden: true
-sidebar_position: 10
----
-
-# “ClickHouse” 有什么含义? {#what-does-clickhouse-mean}
-
-它是“**点击**流”和“数据**仓库**”的组合。它来自于Yandex最初的用例。在Metrica网站上,ClickHouse本应该保存人们在互联网上的所有点击记录,现在它仍然在做这项工作。你可以在[ClickHouse history](../../introduction/history.md)页面上阅读更多关于这个用例的信息。
-
-这个由两部分组成的意思有两个结果:
-
-- 唯一正确的写“Click**H**ouse”的方式是用大写H。
-- 如果需要缩写,请使用“**CH**”。由于一些历史原因,缩写CK在中国也很流行,主要是因为中文中最早的一个关于ClickHouse的演讲使用了这种形式。
-
-!!! info “有趣的事实”
-    多年后ClickHouse闻名于世, 这种命名方法:结合各有深意的两个词被赞扬为最好的数据库命名方式, 卡内基梅隆大学数据库副教授[Andy Pavlo做的研究](https://www.cs.cmu.edu/~pavlo/blog/2020/03/on-naming-a-database-management-system.html) 。ClickHouse与Postgres共同获得“史上最佳数据库名”奖。
+title: "\u201CClickHouse\u201D 有什么含义?"
+toc_hidden: true
+sidebar_position: 10
+---
+
+# “ClickHouse” 有什么含义? {#what-does-clickhouse-mean}
+
+它是“**点击**流”和“数据**仓库**”的组合。它来自于Yandex最初的用例。在Metrica网站上,ClickHouse本应该保存人们在互联网上的所有点击记录,现在它仍然在做这项工作。你可以在[ClickHouse history](../../introduction/history.md)页面上阅读更多关于这个用例的信息。
+
+这个由两部分组成的意思有两个结果:
+
+- 唯一正确的写“Click**H**ouse”的方式是用大写H。
+- 如果需要缩写,请使用“**CH**”。由于一些历史原因,缩写CK在中国也很流行,主要是因为中文中最早的一个关于ClickHouse的演讲使用了这种形式。
+
+!!! info “有趣的事实”
+    多年后ClickHouse闻名于世, 这种命名方法:结合各有深意的两个词被赞扬为最好的数据库命名方式, 卡内基梅隆大学数据库副教授[Andy Pavlo做的研究](https://www.cs.cmu.edu/~pavlo/blog/2020/03/on-naming-a-database-management-system.html) 。ClickHouse与Postgres共同获得“史上最佳数据库名”奖。
diff --git a/docs/zh/faq/general/how-do-i-contribute-code-to-clickhouse.md b/docs/zh/faq/general/how-do-i-contribute-code-to-clickhouse.md
index daa7abf525f..16f48baf7ef 100644
--- a/docs/zh/faq/general/how-do-i-contribute-code-to-clickhouse.md
+++ b/docs/zh/faq/general/how-do-i-contribute-code-to-clickhouse.md
@@ -1,18 +1,18 @@
----
+---
 slug: /zh/faq/general/how-do-i-contribute-code-to-clickhouse
-title: 我如何为ClickHouse贡献代码?
-toc_hidden: true
-sidebar_position: 120
----
-
-# 我如何为ClickHouse贡献代码? {#how-do-i-contribute-code-to-clickhouse}
-
-ClickHouse是一个开源项目[在GitHub上开发](https://github.com/ClickHouse/ClickHouse)。
-
-按照惯例,贡献指南发布在源代码库根目录的 [CONTRIBUTING.md](https://github.com/ClickHouse/ClickHouse/blob/master/CONTRIBUTING.md)文件中。
-
-如果你想对ClickHouse提出实质性的改变建议,可以考虑[在GitHub上发布一个问题](https://github.com/ClickHouse/ClickHouse/issues/new/choose),解释一下你想做什么,先与维护人员和社区讨论一下。[此类RFC问题的例子](https://github.com/ClickHouse/ClickHouse/issues?q=is%3Aissue+is%3Aopen+rfc)。
-
-如果您的贡献与安全相关,也请查看[我们的安全政策](https://github.com/ClickHouse/ClickHouse/security/policy/)。
-
-
+title: 我如何为ClickHouse贡献代码?
+toc_hidden: true
+sidebar_position: 120
+---
+
+# 我如何为ClickHouse贡献代码?
{#how-do-i-contribute-code-to-clickhouse} + +ClickHouse是一个开源项目[在GitHub上开发](https://github.com/ClickHouse/ClickHouse)。 + +按照惯例,贡献指南发布在源代码库根目录的 [CONTRIBUTING.md](https://github.com/ClickHouse/ClickHouse/blob/master/CONTRIBUTING.md)文件中。 + +如果你想对ClickHouse提出实质性的改变建议,可以考虑[在GitHub上发布一个问题](https://github.com/ClickHouse/ClickHouse/issues/new/choose),解释一下你想做什么,先与维护人员和社区讨论一下。[此类RFC问题的例子](https://github.com/ClickHouse/ClickHouse/issues?q=is%3Aissue+is%3Aopen+rfc)。 + +如果您的贡献与安全相关,也请查看[我们的安全政策](https://github.com/ClickHouse/ClickHouse/security/policy/)。 + + diff --git a/docs/zh/faq/integration/index.md b/docs/zh/faq/integration/index.md index 3a3f97761f3..b0ca2d05c05 100644 --- a/docs/zh/faq/integration/index.md +++ b/docs/zh/faq/integration/index.md @@ -1,22 +1,22 @@ ---- -slug: /zh/faq/integration/ -title: 关于集成ClickHouse和其他系统的问题 -toc_hidden_folder: true -sidebar_position: 4 -sidebar_label: Integration ---- - -# 关于集成ClickHouse和其他系统的问题 {#question-about-integrating-clickhouse-and-other-systems} - -问题: - -- [如何从 ClickHouse 导出数据到一个文件?](../../faq/integration/file-export.md) -- [如何导入JSON到ClickHouse?](../../faq/integration/json-import.md) -- [如果我用ODBC链接Oracle数据库出现编码问题该怎么办?](../../faq/integration/oracle-odbc.md) - - - -!!! info "没看到你要找的东西吗?" - 查看[其他faq类别](../../faq/index.md)或浏览左边栏中的主要文档文章。 - +--- +slug: /zh/faq/integration/ +title: 关于集成ClickHouse和其他系统的问题 +toc_hidden_folder: true +sidebar_position: 4 +sidebar_label: Integration +--- + +# 关于集成ClickHouse和其他系统的问题 {#question-about-integrating-clickhouse-and-other-systems} + +问题: + +- [如何从 ClickHouse 导出数据到一个文件?](../../faq/integration/file-export.md) +- [如何导入JSON到ClickHouse?](../../faq/integration/json-import.md) +- [如果我用ODBC链接Oracle数据库出现编码问题该怎么办?](../../faq/integration/oracle-odbc.md) + + + +!!! info "没看到你要找的东西吗?" + 查看[其他faq类别](../../faq/index.md)或浏览左边栏中的主要文档文章。 + {## [原文](https://clickhouse.com/docs/en/faq/integration/) ##} \ No newline at end of file diff --git a/docs/zh/faq/operations/index.md b/docs/zh/faq/operations/index.md index 153eda6199a..1fe84655ada 100644 --- a/docs/zh/faq/operations/index.md +++ b/docs/zh/faq/operations/index.md @@ -1,21 +1,21 @@ ---- -slug: /zh/faq/operations/ -title: 关于操作ClickHouse服务器和集群的问题 -toc_hidden_folder: true -sidebar_position: 3 -sidebar_label: Operations ---- - -# 关于操作ClickHouse服务器和集群的问题 {#question-about-operating-clickhouse-servers-and-clusters} - -问题: - -- [如果想在生产环境部署,需要用哪个版本的 ClickHouse 呢?](../../faq/operations/production.md) -- [是否可能从 ClickHouse 数据表中删除所有旧的数据记录?](../../faq/operations/delete-old-data.md) -- [ClickHouse支持多区域复制吗?](../../faq/operations/multi-region-replication.md) - - -!!! info "没看到你要找的东西吗?" - 查看[其他faq类别](../../faq/index.md)或浏览左边栏中的主要文档文章。 - -{## [原文](https://clickhouse.com/docs/en/faq/production/) ##} +--- +slug: /zh/faq/operations/ +title: 关于操作ClickHouse服务器和集群的问题 +toc_hidden_folder: true +sidebar_position: 3 +sidebar_label: Operations +--- + +# 关于操作ClickHouse服务器和集群的问题 {#question-about-operating-clickhouse-servers-and-clusters} + +问题: + +- [如果想在生产环境部署,需要用哪个版本的 ClickHouse 呢?](../../faq/operations/production.md) +- [是否可能从 ClickHouse 数据表中删除所有旧的数据记录?](../../faq/operations/delete-old-data.md) +- [ClickHouse支持多区域复制吗?](../../faq/operations/multi-region-replication.md) + + +!!! info "没看到你要找的东西吗?" 
+ 查看[其他faq类别](../../faq/index.md)或浏览左边栏中的主要文档文章。 + +{## [原文](https://clickhouse.com/docs/en/faq/production/) ##} diff --git a/docs/zh/faq/operations/multi-region-replication.md b/docs/zh/faq/operations/multi-region-replication.md index 05f856a9ea7..14df8b72eff 100644 --- a/docs/zh/faq/operations/multi-region-replication.md +++ b/docs/zh/faq/operations/multi-region-replication.md @@ -1,15 +1,15 @@ ---- +--- slug: /zh/faq/operations/multi-region-replication -title: ClickHouse支持多区域复制吗? -toc_hidden: true -sidebar_position: 30 ---- - -# ClickHouse支持多区域复制吗? {#does-clickhouse-support-multi-region-replication} - -简短的回答是“是的”。然而,我们建议将所有区域/数据中心之间的延迟保持在两位数字范围内,否则,在通过分布式共识协议时,写性能将受到影响。例如,美国海岸之间的复制可能会很好,但美国和欧洲之间就不行。 - -在配置方面,这与单区域复制没有区别,只是使用位于不同位置的主机作为副本。 - -更多信息,请参见[关于数据复制的完整文章](../../engines/table-engines/mergetree-family/replication.md)。 - +title: ClickHouse支持多区域复制吗? +toc_hidden: true +sidebar_position: 30 +--- + +# ClickHouse支持多区域复制吗? {#does-clickhouse-support-multi-region-replication} + +简短的回答是“是的”。然而,我们建议将所有区域/数据中心之间的延迟保持在两位数字范围内,否则,在通过分布式共识协议时,写性能将受到影响。例如,美国海岸之间的复制可能会很好,但美国和欧洲之间就不行。 + +在配置方面,这与单区域复制没有区别,只是使用位于不同位置的主机作为副本。 + +更多信息,请参见[关于数据复制的完整文章](../../engines/table-engines/mergetree-family/replication.md)。 + diff --git a/docs/zh/operations/settings/settings.md b/docs/zh/operations/settings/settings.md index 86e205ea401..1874970ac95 100644 --- a/docs/zh/operations/settings/settings.md +++ b/docs/zh/operations/settings/settings.md @@ -1203,7 +1203,7 @@ ClickHouse生成异常 - 类型:布尔 - 默认值:True -启用数据格式的保序并行分析。 仅支持TSV,TKSV,CSV和JSONEachRow格式。 +启用数据格式的保序并行分析。 仅支持TSV,TSKV,CSV和JSONEachRow格式。 ## min_chunk_bytes_for_parallel_parsing {#min-chunk-bytes-for-parallel-parsing} diff --git a/docs/zh/operations/system-tables/storage_policies.md b/docs/zh/operations/system-tables/storage_policies.md index e29915a98da..27219f789f4 100644 --- a/docs/zh/operations/system-tables/storage_policies.md +++ b/docs/zh/operations/system-tables/storage_policies.md @@ -13,6 +13,5 @@ slug: /zh/operations/system-tables/storage_policies - `disks` ([Array(String)](../../sql-reference/data-types/array.md)) — 存储策略中定义的磁盘名。 - `max_data_part_size` ([UInt64](../../sql-reference/data-types/int-uint.md)) — 可以存储在卷磁盘上数据部分的最大大小 (0 - 不限制)。 - `move_factor` ([Float64](../../sql-reference/data-types/float.md)) — 磁盘空闲的比率。当比率超过配置的值,ClickHouse 将把数据向下一个卷移动。 -- `prefer_not_to_merge` ([UInt8](../../sql-reference/data-types/int-uint.md)) — 设置中 `prefer_not_to_merge` 的值. 当这个设置启用时,不允许在此卷上合并数据。这将允许控制 ClickHouse 如何与运行速度较慢的磁盘一起工作。 如果存储策略包含多个卷,则每个卷的信息将在表中作为单独一行存储。 diff --git a/docs/zh/sql-reference/statements/select/order-by.md b/docs/zh/sql-reference/statements/select/order-by.md index 01f702a4b1e..3286fc9f9e7 100644 --- a/docs/zh/sql-reference/statements/select/order-by.md +++ b/docs/zh/sql-reference/statements/select/order-by.md @@ -61,6 +61,22 @@ sidebar_label: ORDER BY 我们只建议使用 `COLLATE` 对于少量行的最终排序,因为排序与 `COLLATE` 比正常的按字节排序效率低。 +## ORDER BY ALL + +`ORDER BY ALL` 对所有选定的列进行升序排序。 + +示例: + +``` sql +SELECT a, b, c FROM t ORDER BY ALL +``` + +等同于: + +``` sql +SELECT a, b, c FROM t ORDER BY a, b, c +``` + ## 实现细节 {#implementation-details} 更少的RAM使用,如果一个足够小 [LIMIT](../../../sql-reference/statements/select/limit.md) 除了指定 `ORDER BY`. 
否则,所花费的内存量与用于排序的数据量成正比。 对于分布式查询处理,如果 [GROUP BY](../../../sql-reference/statements/select/group-by.md) 省略排序,在远程服务器上部分完成排序,并将结果合并到请求者服务器上。 这意味着对于分布式排序,要排序的数据量可以大于单个服务器上的内存量。 diff --git a/docs/zh/sql-reference/table-functions/s3.md b/docs/zh/sql-reference/table-functions/s3.md index a62fa9ebb19..f7384a7526e 100644 --- a/docs/zh/sql-reference/table-functions/s3.md +++ b/docs/zh/sql-reference/table-functions/s3.md @@ -11,7 +11,7 @@ sidebar_label: s3 **语法** ``` sql -s3(path, [aws_access_key_id, aws_secret_access_key,] format, structure, [compression]) +s3(path [,access_key_id, secret_access_key [,session_token]] ,format, structure, [compression]) ``` **参数** diff --git a/programs/bash-completion/completions/ch b/programs/bash-completion/completions/ch new file mode 120000 index 00000000000..7101fd9ed04 --- /dev/null +++ b/programs/bash-completion/completions/ch @@ -0,0 +1 @@ +clickhouse \ No newline at end of file diff --git a/programs/bash-completion/completions/chc b/programs/bash-completion/completions/chc new file mode 100644 index 00000000000..0e34cd4eab2 --- /dev/null +++ b/programs/bash-completion/completions/chc @@ -0,0 +1,2 @@ +[[ -v $_CLICKHOUSE_COMPLETION_LOADED ]] || source "$(dirname "${BASH_SOURCE[0]}")/clickhouse-bootstrap" +_complete_clickhouse_generic chc diff --git a/programs/bash-completion/completions/chl b/programs/bash-completion/completions/chl new file mode 100644 index 00000000000..6d0338bf122 --- /dev/null +++ b/programs/bash-completion/completions/chl @@ -0,0 +1,2 @@ +[[ -v $_CLICKHOUSE_COMPLETION_LOADED ]] || source "$(dirname "${BASH_SOURCE[0]}")/clickhouse-bootstrap" +_complete_clickhouse_generic chl diff --git a/programs/bash-completion/completions/clickhouse b/programs/bash-completion/completions/clickhouse index fc55398dcf1..ff0a60c60be 100644 --- a/programs/bash-completion/completions/clickhouse +++ b/programs/bash-completion/completions/clickhouse @@ -31,3 +31,4 @@ function _complete_for_clickhouse_entrypoint_bin() } _complete_clickhouse_generic clickhouse _complete_for_clickhouse_entrypoint_bin +_complete_clickhouse_generic ch _complete_for_clickhouse_entrypoint_bin diff --git a/programs/benchmark/Benchmark.cpp b/programs/benchmark/Benchmark.cpp index d6b8b38d84d..59fc6c0c17f 100644 --- a/programs/benchmark/Benchmark.cpp +++ b/programs/benchmark/Benchmark.cpp @@ -35,7 +35,6 @@ #include #include #include -#include /** A tool for evaluating ClickHouse performance. 
@@ -405,7 +404,7 @@ private: || sigaddset(&sig_set, SIGINT) || pthread_sigmask(SIG_BLOCK, &sig_set, nullptr)) { - throwFromErrno("Cannot block signal.", ErrorCodes::CANNOT_BLOCK_SIGNAL); + throw ErrnoException(ErrorCodes::CANNOT_BLOCK_SIGNAL, "Cannot block signal"); } while (true) diff --git a/programs/copier/ClusterCopierApp.cpp b/programs/copier/ClusterCopierApp.cpp index 8f24d13d379..e3371185aad 100644 --- a/programs/copier/ClusterCopierApp.cpp +++ b/programs/copier/ClusterCopierApp.cpp @@ -2,6 +2,7 @@ #include #include #include +#include #include #include #include @@ -159,6 +160,7 @@ void ClusterCopierApp::mainImpl() registerFunctions(); registerAggregateFunctions(); registerTableFunctions(); + registerDatabases(); registerStorages(); registerDictionaries(); registerDisks(/* global_skip_access_check= */ true); diff --git a/programs/disks/CommandCopy.cpp b/programs/disks/CommandCopy.cpp index 421e4038d12..f176fa277d7 100644 --- a/programs/disks/CommandCopy.cpp +++ b/programs/disks/CommandCopy.cpp @@ -36,7 +36,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 2) @@ -51,8 +51,8 @@ public: const String & path_from = command_arguments[0]; const String & path_to = command_arguments[1]; - DiskPtr disk_from = global_context->getDisk(disk_name_from); - DiskPtr disk_to = global_context->getDisk(disk_name_to); + DiskPtr disk_from = disk_selector->get(disk_name_from); + DiskPtr disk_to = disk_selector->get(disk_name_to); String relative_path_from = validatePathAndGetAsRelative(path_from); String relative_path_to = validatePathAndGetAsRelative(path_to); diff --git a/programs/disks/CommandLink.cpp b/programs/disks/CommandLink.cpp index 357832865fb..dbaa3162f82 100644 --- a/programs/disks/CommandLink.cpp +++ b/programs/disks/CommandLink.cpp @@ -27,7 +27,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 2) @@ -41,7 +41,7 @@ public: const String & path_from = command_arguments[0]; const String & path_to = command_arguments[1]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path_from = validatePathAndGetAsRelative(path_from); String relative_path_to = validatePathAndGetAsRelative(path_to); diff --git a/programs/disks/CommandList.cpp b/programs/disks/CommandList.cpp index 48b54b70014..ea84cd0682d 100644 --- a/programs/disks/CommandList.cpp +++ b/programs/disks/CommandList.cpp @@ -33,7 +33,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 1) @@ -46,7 +46,7 @@ public: const String & path = command_arguments[0]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path = validatePathAndGetAsRelative(path); diff --git a/programs/disks/CommandListDisks.cpp b/programs/disks/CommandListDisks.cpp index 7b2fcd16107..79da021fd00 100644 --- a/programs/disks/CommandListDisks.cpp +++ b/programs/disks/CommandListDisks.cpp @@ -26,8 +26,8 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, - 
Poco::Util::LayeredConfiguration &) override + std::shared_ptr &, + Poco::Util::LayeredConfiguration & config) override { if (!command_arguments.empty()) { @@ -35,8 +35,29 @@ public: throw DB::Exception(DB::ErrorCodes::BAD_ARGUMENTS, "Bad Arguments"); } - for (const auto & [disk_name, _] : global_context->getDisksMap()) - std::cout << disk_name << '\n'; + constexpr auto config_prefix = "storage_configuration.disks"; + constexpr auto default_disk_name = "default"; + + Poco::Util::AbstractConfiguration::Keys keys; + config.keys(config_prefix, keys); + + bool has_default_disk = false; + + /// For the output to be ordered + std::set disks; + + for (const auto & disk_name : keys) + { + if (disk_name == default_disk_name) + has_default_disk = true; + disks.insert(disk_name); + } + + if (!has_default_disk) + disks.insert(default_disk_name); + + for (const auto & disk : disks) + std::cout << disk << '\n'; } }; } diff --git a/programs/disks/CommandMkDir.cpp b/programs/disks/CommandMkDir.cpp index e5df982d896..6d33bdec498 100644 --- a/programs/disks/CommandMkDir.cpp +++ b/programs/disks/CommandMkDir.cpp @@ -34,7 +34,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 1) @@ -47,7 +47,7 @@ public: const String & path = command_arguments[0]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path = validatePathAndGetAsRelative(path); bool recursive = config.getBool("recursive", false); diff --git a/programs/disks/CommandMove.cpp b/programs/disks/CommandMove.cpp index 654090b2138..75cf96252ed 100644 --- a/programs/disks/CommandMove.cpp +++ b/programs/disks/CommandMove.cpp @@ -26,7 +26,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 2) @@ -40,7 +40,7 @@ public: const String & path_from = command_arguments[0]; const String & path_to = command_arguments[1]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path_from = validatePathAndGetAsRelative(path_from); String relative_path_to = validatePathAndGetAsRelative(path_to); diff --git a/programs/disks/CommandRead.cpp b/programs/disks/CommandRead.cpp index b6cacdd2c61..85041faf22c 100644 --- a/programs/disks/CommandRead.cpp +++ b/programs/disks/CommandRead.cpp @@ -36,7 +36,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 1) @@ -47,7 +47,7 @@ public: String disk_name = config.getString("disk", "default"); - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path = validatePathAndGetAsRelative(command_arguments[0]); diff --git a/programs/disks/CommandRemove.cpp b/programs/disks/CommandRemove.cpp index ff8d4a1c6bb..0c631eacff3 100644 --- a/programs/disks/CommandRemove.cpp +++ b/programs/disks/CommandRemove.cpp @@ -26,7 +26,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if 
(command_arguments.size() != 1) @@ -39,7 +39,7 @@ public: const String & path = command_arguments[0]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path = validatePathAndGetAsRelative(path); diff --git a/programs/disks/CommandWrite.cpp b/programs/disks/CommandWrite.cpp index d075daf3215..7ded37e067a 100644 --- a/programs/disks/CommandWrite.cpp +++ b/programs/disks/CommandWrite.cpp @@ -37,7 +37,7 @@ public: void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) override { if (command_arguments.size() != 1) @@ -50,7 +50,7 @@ public: const String & path = command_arguments[0]; - DiskPtr disk = global_context->getDisk(disk_name); + DiskPtr disk = disk_selector->get(disk_name); String relative_path = validatePathAndGetAsRelative(path); diff --git a/programs/disks/DisksApp.cpp b/programs/disks/DisksApp.cpp index b81cd52f8c8..ded324fd0da 100644 --- a/programs/disks/DisksApp.cpp +++ b/programs/disks/DisksApp.cpp @@ -209,7 +209,35 @@ int DisksApp::main(const std::vector & /*args*/) po::parsed_options parsed = parser.run(); args = po::collect_unrecognized(parsed.options, po::collect_unrecognized_mode::include_positional); } - command->execute(args, global_context, config()); + + std::unordered_set disks + { + config().getString("disk", "default"), + config().getString("disk-from", config().getString("disk", "default")), + config().getString("disk-to", config().getString("disk", "default")), + }; + + auto validator = [&disks]( + const Poco::Util::AbstractConfiguration & config, + const std::string & disk_config_prefix, + const std::string & disk_name) + { + if (!disks.contains(disk_name)) + return false; + + const auto disk_type = config.getString(disk_config_prefix + ".type", "local"); + + if (disk_type == "cache") + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Disk type 'cache' of disk {} is not supported by clickhouse-disks", disk_name); + + return true; + }; + + constexpr auto config_prefix = "storage_configuration.disks"; + auto disk_selector = std::make_shared(); + disk_selector->initialize(config(), config_prefix, global_context, validator); + + command->execute(args, disk_selector, config()); return Application::EXIT_OK; } diff --git a/programs/disks/ICommand.h b/programs/disks/ICommand.h index de41eedec35..da106e1084e 100644 --- a/programs/disks/ICommand.h +++ b/programs/disks/ICommand.h @@ -1,6 +1,7 @@ #pragma once #include +#include #include @@ -25,7 +26,7 @@ public: virtual void execute( const std::vector & command_arguments, - DB::ContextMutablePtr & global_context, + std::shared_ptr & disk_selector, Poco::Util::LayeredConfiguration & config) = 0; const std::optional & getCommandOptions() const { return command_option_description; } diff --git a/programs/format/Format.cpp b/programs/format/Format.cpp index d7d61bbcd3b..05ba86069d7 100644 --- a/programs/format/Format.cpp +++ b/programs/format/Format.cpp @@ -17,6 +17,7 @@ #include #include +#include #include #include #include @@ -24,6 +25,7 @@ #include #include #include +#include #include #include #include @@ -32,6 +34,9 @@ #pragma GCC diagnostic ignored "-Wunused-function" #pragma GCC diagnostic ignored "-Wmissing-declarations" +extern const char * auto_time_zones[]; + + namespace DB { namespace ErrorCodes @@ -126,6 +131,7 @@ int mainEntryClickHouseFormat(int argc, char ** argv) registerFunctions(); registerAggregateFunctions(); registerTableFunctions(); 
+ registerDatabases(); registerStorages(); registerFormats(); @@ -133,9 +139,25 @@ int mainEntryClickHouseFormat(int argc, char ** argv) auto all_known_storage_names = StorageFactory::instance().getAllRegisteredNames(); auto all_known_data_type_names = DataTypeFactory::instance().getAllRegisteredNames(); + auto all_known_settings = Settings().getAllRegisteredNames(); + auto all_known_merge_tree_settings = MergeTreeSettings().getAllRegisteredNames(); additional_names.insert(all_known_storage_names.begin(), all_known_storage_names.end()); additional_names.insert(all_known_data_type_names.begin(), all_known_data_type_names.end()); + additional_names.insert(all_known_settings.begin(), all_known_settings.end()); + additional_names.insert(all_known_merge_tree_settings.begin(), all_known_merge_tree_settings.end()); + + for (auto * it = auto_time_zones; *it; ++it) + { + String time_zone_name = *it; + + /// Example: Europe/Amsterdam + Strings split; + boost::split(split, time_zone_name, [](char c){ return c == '/'; }); + for (const auto & word : split) + if (!word.empty()) + additional_names.insert(word); + } KnownIdentifierFunc is_known_identifier = [&](std::string_view name) { diff --git a/programs/install/Install.cpp b/programs/install/Install.cpp index 9d4d791263b..52f30098b38 100644 --- a/programs/install/Install.cpp +++ b/programs/install/Install.cpp @@ -328,7 +328,7 @@ int mainEntryClickHouseInstall(int argc, char ** argv) fs::create_symlink(binary_self_canonical_path, main_bin_path); if (0 != chmod(binary_self_canonical_path.string().c_str(), S_IRUSR | S_IRGRP | S_IROTH | S_IXUSR | S_IXGRP | S_IXOTH)) - throwFromErrno(fmt::format("Cannot chmod {}", binary_self_canonical_path.string()), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot chmod {}", binary_self_canonical_path.string()); } } else @@ -361,7 +361,7 @@ int mainEntryClickHouseInstall(int argc, char ** argv) if (already_installed) { if (0 != chmod(main_bin_path.string().c_str(), S_IRUSR | S_IRGRP | S_IROTH | S_IXUSR | S_IXGRP | S_IXOTH)) - throwFromErrno(fmt::format("Cannot chmod {}", main_bin_path.string()), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot chmod {}", main_bin_path.string()); } else { @@ -395,7 +395,7 @@ int mainEntryClickHouseInstall(int argc, char ** argv) } if (0 != chmod(destination.c_str(), S_IRUSR | S_IRGRP | S_IROTH | S_IXUSR | S_IXGRP | S_IXOTH)) - throwFromErrno(fmt::format("Cannot chmod {}", main_bin_tmp_path.string()), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot chmod {}", main_bin_tmp_path.string()); } catch (const Exception & e) { @@ -1122,7 +1122,7 @@ namespace return 0; } else - throwFromErrno(fmt::format("Cannot obtain the status of pid {} with `kill`", pid), ErrorCodes::CANNOT_KILL); + throw ErrnoException(ErrorCodes::CANNOT_KILL, "Cannot obtain the status of pid {} with `kill`", pid); } if (!pid) @@ -1143,7 +1143,7 @@ namespace if (0 == kill(pid, signal)) fmt::print("Sent {} signal to process with pid {}.\n", signal_name, pid); else - throwFromErrno(fmt::format("Cannot send {} signal", signal_name), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot send {} signal", signal_name); size_t try_num = 0; for (; try_num < max_tries; ++try_num) diff --git a/programs/keeper/CMakeLists.txt b/programs/keeper/CMakeLists.txt index cdb1d89b18e..b8f538f821c 100644 --- a/programs/keeper/CMakeLists.txt +++ b/programs/keeper/CMakeLists.txt @@ -68,6 +68,7 @@ if 
(BUILD_STANDALONE_KEEPER) ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/waitServersToFinish.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/ServerType.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/HTTPRequestHandlerFactoryMain.cpp + ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/KeeperReadinessHandler.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/HTTP/HTTPServer.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/HTTP/ReadHeaders.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Server/HTTP/HTTPServerConnection.cpp @@ -114,6 +115,7 @@ if (BUILD_STANDALONE_KEEPER) ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/LocalDirectorySyncGuard.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/TemporaryFileOnDisk.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/loadLocalDiskConfig.cpp + ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/DiskType.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/ObjectStorages/IObjectStorage.cpp ${CMAKE_CURRENT_SOURCE_DIR}/../../src/Disks/ObjectStorages/MetadataStorageFromPlainObjectStorage.cpp diff --git a/programs/keeper/Keeper.cpp b/programs/keeper/Keeper.cpp index e04e669abae..48d26233d94 100644 --- a/programs/keeper/Keeper.cpp +++ b/programs/keeper/Keeper.cpp @@ -14,6 +14,7 @@ #include #include #include +#include #include #include #include @@ -32,6 +33,7 @@ #include #include #include +#include #include "Core/Defines.h" #include "config.h" @@ -289,6 +291,33 @@ try if (!config().has("keeper_server")) throw Exception(ErrorCodes::NO_ELEMENTS_IN_CONFIG, "Keeper configuration ( section) not found in config"); + auto updateMemorySoftLimitInConfig = [&](Poco::Util::AbstractConfiguration & config) + { + UInt64 memory_soft_limit = 0; + if (config.has("keeper_server.max_memory_usage_soft_limit")) + { + memory_soft_limit = config.getUInt64("keeper_server.max_memory_usage_soft_limit"); + } + + /// if memory soft limit is not set, we will use default value + if (memory_soft_limit == 0) + { + Float64 ratio = 0.9; + if (config.has("keeper_server.max_memory_usage_soft_limit_ratio")) + ratio = config.getDouble("keeper_server.max_memory_usage_soft_limit_ratio"); + + size_t physical_server_memory = getMemoryAmount(); + if (ratio > 0 && physical_server_memory > 0) + { + memory_soft_limit = static_cast(physical_server_memory * ratio); + config.setUInt64("keeper_server.max_memory_usage_soft_limit", memory_soft_limit); + } + } + LOG_INFO(log, "keeper_server.max_memory_usage_soft_limit is set to {}", formatReadableSizeWithBinarySuffix(memory_soft_limit)); + }; + + updateMemorySoftLimitInConfig(config()); + std::string path; if (config().has("keeper_server.storage_path")) @@ -328,6 +357,13 @@ try config().getUInt("max_thread_pool_free_size", 1000), config().getUInt("thread_pool_queue_size", 10000) ); + /// Wait for all threads to avoid possible use-after-free (for example logging objects can be already destroyed). 
+ SCOPE_EXIT({ + Stopwatch watch; + LOG_INFO(log, "Waiting for background threads"); + GlobalThreadPool::instance().shutdown(); + LOG_INFO(log, "Background threads finished in {} ms", watch.elapsedMilliseconds()); + }); static ServerErrorHandler error_handler; Poco::ErrorHandler::set(&error_handler); @@ -459,6 +495,29 @@ try std::make_unique( std::move(my_http_context), createPrometheusMainHandlerFactory(*this, config_getter(), async_metrics, "PrometheusHandler-factory"), server_pool, socket, http_params)); }); + + /// HTTP control endpoints + port_name = "keeper_server.http_control.port"; + createServer(listen_host, port_name, listen_try, [&](UInt16 port) mutable + { + auto my_http_context = httpContext(); + Poco::Timespan my_keep_alive_timeout(config.getUInt("keep_alive_timeout", 10), 0); + Poco::Net::HTTPServerParams::Ptr my_http_params = new Poco::Net::HTTPServerParams; + my_http_params->setTimeout(my_http_context->getReceiveTimeout()); + my_http_params->setKeepAliveTimeout(my_keep_alive_timeout); + + Poco::Net::ServerSocket socket; + auto address = socketBindListen(socket, listen_host, port); + socket.setReceiveTimeout(my_http_context->getReceiveTimeout()); + socket.setSendTimeout(my_http_context->getSendTimeout()); + servers->emplace_back( + listen_host, + port_name, + "HTTP Control: http://" + address.toString(), + std::make_unique( + std::move(my_http_context), createKeeperHTTPControlMainHandlerFactory(config_getter(), global_context->getKeeperDispatcher(), "KeeperHTTPControlHandler-factory"), server_pool, socket, http_params) + ); + }); } for (auto & server : *servers) @@ -492,6 +551,8 @@ try { updateLevels(*config, logger()); + updateMemorySoftLimitInConfig(*config); + if (config->has("keeper_server")) global_context->updateKeeperConfiguration(*config); diff --git a/programs/local/LocalServer.cpp b/programs/local/LocalServer.cpp index fbb64ea1135..ccd3d84630f 100644 --- a/programs/local/LocalServer.cpp +++ b/programs/local/LocalServer.cpp @@ -10,6 +10,7 @@ #include #include #include +#include #include #include #include @@ -43,7 +44,7 @@ #include #include #include -#include +#include #include #include #include @@ -489,6 +490,7 @@ try registerFunctions(); registerAggregateFunctions(); registerTableFunctions(); + registerDatabases(); registerStorages(); registerDictionaries(); registerDisks(/* global_skip_access_check= */ true); @@ -726,12 +728,7 @@ void LocalServer::processConfig() /// We load temporary database first, because projections need it. DatabaseCatalog::instance().initializeAndLoadTemporaryDatabase(); - /** Init dummy default DB - * NOTE: We force using isolated default database to avoid conflicts with default database from server environment - * Otherwise, metadata of temporary File(format, EXPLICIT_PATH) tables will pollute metadata/ directory; - * if such tables will not be dropped, clickhouse-server will not be able to load them due to security reasons. 
- */ - std::string default_database = config().getString("default_database", "_local"); + std::string default_database = config().getString("default_database", "default"); DatabaseCatalog::instance().attachDatabase(default_database, createClickHouseLocalDatabaseOverlay(default_database, global_context)); global_context->setCurrentDatabase(default_database); @@ -744,7 +741,7 @@ void LocalServer::processConfig() LOG_DEBUG(log, "Loading metadata from {}", path); auto startup_system_tasks = loadMetadataSystem(global_context); - attachSystemTablesLocal(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::SYSTEM_DATABASE)); + attachSystemTablesServer(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::SYSTEM_DATABASE), false); attachInformationSchema(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::INFORMATION_SCHEMA)); attachInformationSchema(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::INFORMATION_SCHEMA_UPPERCASE)); waitLoad(TablesLoaderForegroundPoolId, startup_system_tasks); @@ -757,13 +754,13 @@ void LocalServer::processConfig() } /// For ClickHouse local if path is not set the loader will be disabled. - global_context->getUserDefinedSQLObjectsLoader().loadObjects(); + global_context->getUserDefinedSQLObjectsStorage().loadObjects(); LOG_DEBUG(log, "Loaded metadata."); } else if (!config().has("no-system-tables")) { - attachSystemTablesLocal(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::SYSTEM_DATABASE)); + attachSystemTablesServer(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::SYSTEM_DATABASE), false); attachInformationSchema(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::INFORMATION_SCHEMA)); attachInformationSchema(global_context, *createMemoryDatabaseIfNotExists(global_context, DatabaseCatalog::INFORMATION_SCHEMA_UPPERCASE)); } @@ -776,6 +773,7 @@ void LocalServer::processConfig() global_context->setQueryKindInitial(); global_context->setQueryKind(query_kind); + global_context->setQueryParameters(query_parameters); } @@ -822,6 +820,7 @@ void LocalServer::printHelpMessage([[maybe_unused]] const OptionsDescription & o std::cout << getHelpHeader() << "\n"; std::cout << options_description.main_description.value() << "\n"; std::cout << getHelpFooter() << "\n"; + std::cout << "In addition, --param_name=value can be specified for substitution of parameters for parametrized queries.\n"; #endif } @@ -898,7 +897,31 @@ void LocalServer::readArguments(int argc, char ** argv, Arguments & common_argum for (int arg_num = 1; arg_num < argc; ++arg_num) { std::string_view arg = argv[arg_num]; - if (arg == "--multiquery" && (arg_num + 1) < argc && !std::string_view(argv[arg_num + 1]).starts_with('-')) + /// Parameter arg after underline. 
+ if (arg.starts_with("--param_")) + { + auto param_continuation = arg.substr(strlen("--param_")); + auto equal_pos = param_continuation.find_first_of('='); + + if (equal_pos == std::string::npos) + { + /// param_name value + ++arg_num; + if (arg_num >= argc) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Parameter requires value"); + arg = argv[arg_num]; + query_parameters.emplace(String(param_continuation), String(arg)); + } + else + { + if (equal_pos == 0) + throw Exception(ErrorCodes::BAD_ARGUMENTS, "Parameter name cannot be empty"); + + /// param_name=value + query_parameters.emplace(param_continuation.substr(0, equal_pos), param_continuation.substr(equal_pos + 1)); + } + } + else if (arg == "--multiquery" && (arg_num + 1) < argc && !std::string_view(argv[arg_num + 1]).starts_with('-')) { /// Transform the abbreviated syntax '--multiquery ' into the full syntax '--multiquery -q ' ++arg_num; diff --git a/programs/main.cpp b/programs/main.cpp index 959984d565d..7d07112de66 100644 --- a/programs/main.cpp +++ b/programs/main.cpp @@ -158,7 +158,6 @@ std::pair clickhouse_applications[] = std::pair clickhouse_short_names[] = { #if ENABLE_CLICKHOUSE_LOCAL - {"ch", "local"}, {"chl", "local"}, #endif #if ENABLE_CLICKHOUSE_CLIENT @@ -502,6 +501,17 @@ int main(int argc_, char ** argv_) } } + /// Interpret binary without argument or with arguments starts with dash + /// ('-') as clickhouse-local for better usability: + /// + /// clickhouse # dumps help + /// clickhouse -q 'select 1' # use local + /// clickhouse # spawn local + /// clickhouse local # spawn local + /// + if (main_func == printHelp && !argv.empty() && (argv.size() == 1 || argv[1][0] == '-')) + main_func = mainEntryClickHouseLocal; + return main_func(static_cast(argv.size()), argv.data()); } #endif diff --git a/programs/obfuscator/Obfuscator.cpp b/programs/obfuscator/Obfuscator.cpp index 2cb5250cdf2..7e09d5e8046 100644 --- a/programs/obfuscator/Obfuscator.cpp +++ b/programs/obfuscator/Obfuscator.cpp @@ -1307,7 +1307,7 @@ try /// stdin must be seekable auto res = lseek(file->getFD(), 0, SEEK_SET); if (-1 == res) - throwFromErrno("Input must be seekable file (it will be read twice).", ErrorCodes::CANNOT_SEEK_THROUGH_FILE); + throw ErrnoException(ErrorCodes::CANNOT_SEEK_THROUGH_FILE, "Input must be seekable file (it will be read twice)"); SingleReadBufferIterator read_buffer_iterator(std::move(file)); schema_columns = readSchemaFromFormat(input_format, {}, read_buffer_iterator, false, context_const); @@ -1336,7 +1336,7 @@ try /// stdin must be seekable auto res = lseek(file_in.getFD(), 0, SEEK_SET); if (-1 == res) - throwFromErrno("Input must be seekable file (it will be read twice).", ErrorCodes::CANNOT_SEEK_THROUGH_FILE); + throw ErrnoException(ErrorCodes::CANNOT_SEEK_THROUGH_FILE, "Input must be seekable file (it will be read twice)"); } Obfuscator obfuscator(header, seed, markov_model_params); diff --git a/programs/server/Server.cpp b/programs/server/Server.cpp index 36f0ce90e57..926e57070f3 100644 --- a/programs/server/Server.cpp +++ b/programs/server/Server.cpp @@ -45,6 +45,7 @@ #include #include #include +#include #include #include #include @@ -66,11 +67,12 @@ #include #include #include -#include +#include #include #include #include #include +#include #include #include #include @@ -92,6 +94,7 @@ #include #include #include +#include #include #include #include @@ -646,6 +649,7 @@ try registerFunctions(); registerAggregateFunctions(); registerTableFunctions(); + registerDatabases(); registerStorages(); registerDictionaries(); 
registerDisks(/* global_skip_access_check= */ false); @@ -657,6 +661,11 @@ try CurrentMetrics::set(CurrentMetrics::Revision, ClickHouseRevision::getVersionRevision()); CurrentMetrics::set(CurrentMetrics::VersionInteger, ClickHouseRevision::getVersionInteger()); + Poco::ThreadPool server_pool(3, server_settings.max_connections); + std::mutex servers_lock; + std::vector servers; + std::vector servers_to_start_before_tables; + /** Context contains all that query execution is dependent: * settings, available functions, data types, aggregate functions, databases, ... */ @@ -697,6 +706,68 @@ try server_settings.max_thread_pool_size, server_settings.max_thread_pool_free_size, server_settings.thread_pool_queue_size); + /// Wait for all threads to avoid possible use-after-free (for example logging objects can be already destroyed). + SCOPE_EXIT({ + Stopwatch watch; + LOG_INFO(log, "Waiting for background threads"); + GlobalThreadPool::instance().shutdown(); + LOG_INFO(log, "Background threads finished in {} ms", watch.elapsedMilliseconds()); + }); + + /// NOTE: global context should be destroyed *before* GlobalThreadPool::shutdown() + /// Otherwise GlobalThreadPool::shutdown() will hang, since Context holds some threads. + SCOPE_EXIT({ + /** Ask to cancel background jobs all table engines, + * and also query_log. + * It is important to do early, not in destructor of Context, because + * table engines could use Context on destroy. + */ + LOG_INFO(log, "Shutting down storages."); + + global_context->shutdown(); + + LOG_DEBUG(log, "Shut down storages."); + + if (!servers_to_start_before_tables.empty()) + { + LOG_DEBUG(log, "Waiting for current connections to servers for tables to finish."); + size_t current_connections = 0; + { + std::lock_guard lock(servers_lock); + for (auto & server : servers_to_start_before_tables) + { + server.stop(); + current_connections += server.currentConnections(); + } + } + + if (current_connections) + LOG_INFO(log, "Closed all listening sockets. Waiting for {} outstanding connections.", current_connections); + else + LOG_INFO(log, "Closed all listening sockets."); + + if (current_connections > 0) + current_connections = waitServersToFinish(servers_to_start_before_tables, servers_lock, server_settings.shutdown_wait_unfinished); + + if (current_connections) + LOG_INFO(log, "Closed connections to servers for tables. But {} remain. Probably some tables of other users cannot finish their connections after context shutdown.", current_connections); + else + LOG_INFO(log, "Closed connections to servers for tables."); + } + + global_context->shutdownKeeperDispatcher(); + + /// Wait server pool to avoid use-after-free of destroyed context in the handlers + server_pool.joinAll(); + + /** Explicitly destroy Context. It is more convenient than in destructor of Server, because logger is still available. + * At this moment, no one could own shared part of Context. + */ + global_context.reset(); + shared_context.reset(); + LOG_DEBUG(log, "Destroyed global context."); + }); + #if USE_AZURE_BLOB_STORAGE /// It makes sense to deinitialize libxml after joining of all threads @@ -755,10 +826,6 @@ try } } - Poco::ThreadPool server_pool(3, server_settings.max_connections); - std::mutex servers_lock; - std::vector servers; - std::vector servers_to_start_before_tables; /// This object will periodically calculate some metrics. 
ServerAsynchronousMetrics async_metrics( global_context, @@ -1280,9 +1347,10 @@ try global_context->setHTTPHeaderFilter(*config); global_context->setMaxTableSizeToDrop(server_settings_.max_table_size_to_drop); - global_context->setClientHTTPHeaderForbiddenHeaders(server_settings_.get_client_http_header_forbidden_headers); - global_context->setAllowGetHTTPHeaderFunction(server_settings_.allow_get_client_http_header); global_context->setMaxPartitionSizeToDrop(server_settings_.max_partition_size_to_drop); + global_context->setMaxTableNumToWarn(server_settings_.max_table_num_to_warn); + global_context->setMaxDatabaseNumToWarn(server_settings_.max_database_num_to_warn); + global_context->setMaxPartNumToWarn(server_settings_.max_part_num_to_warn); ConcurrencyControl::SlotCount concurrent_threads_soft_limit = ConcurrencyControl::Unlimited; if (server_settings_.concurrent_threads_soft_limit_num > 0 && server_settings_.concurrent_threads_soft_limit_num < concurrent_threads_soft_limit) @@ -1385,8 +1453,6 @@ try global_context->reloadAuxiliaryZooKeepersConfigIfChanged(config); - global_context->reloadQueryMaskingRulesIfChanged(config); - std::lock_guard lock(servers_lock); updateServers(*config, server_pool, async_metrics, servers, servers_to_start_before_tables); } @@ -1407,6 +1473,8 @@ try #endif NamedCollectionUtils::reloadFromConfig(*config); + FileCacheFactory::instance().updateSettingsFromConfig(*config); + ProfileEvents::increment(ProfileEvents::MainConfigLoads); /// Must be the last. @@ -1490,6 +1558,34 @@ try throw Exception(ErrorCodes::SUPPORT_IS_DISABLED, "SSL support for TCP protocol is disabled because Poco library was built without NetSSL support."); #endif }); + + /// HTTP control endpoints + port_name = "keeper_server.http_control.port"; + createServer(config(), listen_host, port_name, listen_try, /* start_server: */ false, + servers_to_start_before_tables, + [&](UInt16 port) -> ProtocolServerAdapter + { + auto http_context = httpContext(); + Poco::Timespan keep_alive_timeout(config().getUInt("keep_alive_timeout", 10), 0); + Poco::Net::HTTPServerParams::Ptr http_params = new Poco::Net::HTTPServerParams; + http_params->setTimeout(http_context->getReceiveTimeout()); + http_params->setKeepAliveTimeout(keep_alive_timeout); + + Poco::Net::ServerSocket socket; + auto address = socketBindListen(config(), socket, listen_host, port); + socket.setReceiveTimeout(http_context->getReceiveTimeout()); + socket.setSendTimeout(http_context->getSendTimeout()); + return ProtocolServerAdapter( + listen_host, + port_name, + "HTTP Control: http://" + address.toString(), + std::make_unique( + std::move(http_context), + createKeeperHTTPControlMainHandlerFactory( + config_getter(), + global_context->getKeeperDispatcher(), + "KeeperHTTPControlHandler-factory"), server_pool, socket, http_params)); + }); } #else throw Exception(ErrorCodes::SUPPORT_IS_DISABLED, "ClickHouse server built without NuRaft library. Cannot use internal coordination."); @@ -1600,60 +1696,6 @@ try /// try set up encryption. There are some errors in config, error will be printed and server wouldn't start. CompressionCodecEncrypted::Configuration::instance().load(config(), "encryption_codecs"); - SCOPE_EXIT({ - async_metrics.stop(); - - /** Ask to cancel background jobs all table engines, - * and also query_log. - * It is important to do early, not in destructor of Context, because - * table engines could use Context on destroy. 
- */ - LOG_INFO(log, "Shutting down storages."); - - global_context->shutdown(); - - LOG_DEBUG(log, "Shut down storages."); - - if (!servers_to_start_before_tables.empty()) - { - LOG_DEBUG(log, "Waiting for current connections to servers for tables to finish."); - size_t current_connections = 0; - { - std::lock_guard lock(servers_lock); - for (auto & server : servers_to_start_before_tables) - { - server.stop(); - current_connections += server.currentConnections(); - } - } - - if (current_connections) - LOG_INFO(log, "Closed all listening sockets. Waiting for {} outstanding connections.", current_connections); - else - LOG_INFO(log, "Closed all listening sockets."); - - if (current_connections > 0) - current_connections = waitServersToFinish(servers_to_start_before_tables, servers_lock, server_settings.shutdown_wait_unfinished); - - if (current_connections) - LOG_INFO(log, "Closed connections to servers for tables. But {} remain. Probably some tables of other users cannot finish their connections after context shutdown.", current_connections); - else - LOG_INFO(log, "Closed connections to servers for tables."); - - global_context->shutdownKeeperDispatcher(); - } - - /// Wait server pool to avoid use-after-free of destroyed context in the handlers - server_pool.joinAll(); - - /** Explicitly destroy Context. It is more convenient than in destructor of Server, because logger is still available. - * At this moment, no one could own shared part of Context. - */ - global_context.reset(); - shared_context.reset(); - LOG_DEBUG(log, "Destroyed global context."); - }); - /// DNSCacheUpdater uses BackgroundSchedulePool which lives in shared context /// and thus this object must be created after the SCOPE_EXIT object where shared /// context is destroyed. @@ -1716,7 +1758,7 @@ try /// After loading validate that default database exists database_catalog.assertDatabaseExists(default_database); /// Load user-defined SQL functions. - global_context->getUserDefinedSQLObjectsLoader().loadObjects(); + global_context->getUserDefinedSQLObjectsStorage().loadObjects(); } catch (...) { @@ -2088,10 +2130,9 @@ void Server::createServers( { const Settings & settings = global_context->getSettingsRef(); - Poco::Timespan keep_alive_timeout(config.getUInt("keep_alive_timeout", 10), 0); Poco::Net::HTTPServerParams::Ptr http_params = new Poco::Net::HTTPServerParams; http_params->setTimeout(settings.http_receive_timeout); - http_params->setKeepAliveTimeout(keep_alive_timeout); + http_params->setKeepAliveTimeout(global_context->getServerSettings().keep_alive_timeout); Poco::Util::AbstractConfiguration::Keys protocols; config.keys("protocols", protocols); @@ -2345,10 +2386,9 @@ void Server::createInterserverServers( { const Settings & settings = global_context->getSettingsRef(); - Poco::Timespan keep_alive_timeout(config.getUInt("keep_alive_timeout", 10), 0); Poco::Net::HTTPServerParams::Ptr http_params = new Poco::Net::HTTPServerParams; http_params->setTimeout(settings.http_receive_timeout); - http_params->setKeepAliveTimeout(keep_alive_timeout); + http_params->setKeepAliveTimeout(global_context->getServerSettings().keep_alive_timeout); /// Now iterate over interserver_listen_hosts for (const auto & interserver_listen_host : interserver_listen_hosts) diff --git a/programs/server/binary.html b/programs/server/binary.html new file mode 100644 index 00000000000..988dd33a72a --- /dev/null +++ b/programs/server/binary.html @@ -0,0 +1,267 @@ + + + + + + ClickHouse Binary Viewer + + + + + +
+
+ + + + + diff --git a/programs/server/config.xml b/programs/server/config.xml index 688f0bf5645..1be20c5cad8 100644 --- a/programs/server/config.xml +++ b/programs/server/config.xml @@ -485,7 +485,6 @@ true - false round_robin diff --git a/programs/server/dashboard.html b/programs/server/dashboard.html index c62e0c98184..04fdfb2d3ca 100644 --- a/programs/server/dashboard.html +++ b/programs/server/dashboard.html @@ -455,6 +455,7 @@
+
@@ -720,7 +721,7 @@ function insertChart(i) { query_editor_confirm.addEventListener('click', editConfirm); /// Ctrl+Enter (or Cmd+Enter on Mac) will also confirm editing. - query_editor.addEventListener('keydown', e => { + query_editor.addEventListener('keydown', event => { if ((event.metaKey || event.ctrlKey) && (event.keyCode == 13 || event.keyCode == 10)) { editConfirm(); } @@ -895,7 +896,7 @@ document.getElementById('add').addEventListener('click', e => { }); document.getElementById('reload').addEventListener('click', e => { - reloadAll(false); + reloadAll(queries.length == 0); }); document.getElementById('search').addEventListener('click', e => { @@ -964,12 +965,10 @@ document.getElementById('mass-editor-textarea').addEventListener('input', e => { function legendAsTooltipPlugin({ className, style = { background: "var(--legend-background)" } } = {}) { let legendEl; - let showTop = false; - const showLimit = 5; + let multiline; function init(u, opts) { legendEl = u.root.querySelector(".u-legend"); - legendEl.classList.remove("u-inline"); className && legendEl.classList.add(className); @@ -985,18 +984,19 @@ function legendAsTooltipPlugin({ className, style = { background: "var(--legend- ...style }); + const nodes = legendEl.querySelectorAll("th"); + for (let i = 0; i < nodes.length; i++) + nodes[i]._order = i; + if (opts.series.length == 2) { - const nodes = legendEl.querySelectorAll("th"); + multiline = false; for (let i = 0; i < nodes.length; i++) nodes[i].style.display = "none"; } else { + multiline = true; legendEl.querySelector("th").remove(); legendEl.querySelector("td").setAttribute('colspan', '2'); legendEl.querySelector("td").style.textAlign = 'center'; - } - - if (opts.series.length - 1 > showLimit) { - showTop = true; let footer = legendEl.insertRow().insertCell(); footer.setAttribute('colspan', '2'); footer.style.textAlign = 'center'; @@ -1023,18 +1023,20 @@ function legendAsTooltipPlugin({ className, style = { background: "var(--legend- left -= legendEl.clientWidth / 2; top -= legendEl.clientHeight / 2; legendEl.style.transform = "translate(" + left + "px, " + top + "px)"; - if (showTop) { + + if (multiline) { let nodes = nodeListToArray(legendEl.querySelectorAll("tr")); let header = nodes.shift(); let footer = nodes.pop(); - nodes.forEach(function (node) { node._sort_key = +node.querySelector("td").textContent; }); - nodes.sort((a, b) => +b._sort_key - +a._sort_key); + let showLimit = Math.floor(u.height / 30); + nodes.forEach(function (node) { node._sort_key = nodes.length > showLimit ? +node.querySelector("td").textContent.replace(/,/g,'') : node._order; }); + nodes.sort((a, b) => b._sort_key - a._sort_key); nodes.forEach(function (node) { node.parentNode.appendChild(node); }); for (let i = 0; i < nodes.length; i++) { nodes[i].style.display = i < showLimit ? null : "none"; - delete nodes[i]._sort_key; } footer.parentNode.appendChild(footer); + footer.style.display = nodes.length > showLimit ? 
null : "none"; } } @@ -1291,6 +1293,7 @@ async function drawAll() { document.getElementById('add').style.display = 'inline-block'; document.getElementById('edit').style.display = 'inline-block'; document.getElementById('search-span').style.display = ''; + hideError(); } else { const charts = document.getElementById('charts') @@ -1317,9 +1320,11 @@ function disableButtons() { reloadButton.classList.add('disabled'); const runButton = document.getElementById('run'); - runButton.value = 'Reloading…'; - runButton.disabled = true; - runButton.classList.add('disabled'); + if (runButton) { + runButton.value = 'Reloading…'; + runButton.disabled = true; + runButton.classList.add('disabled'); + } const searchButton = document.getElementById('search'); searchButton.value = '…'; @@ -1334,9 +1339,11 @@ function enableButtons() { reloadButton.classList.remove('disabled'); const runButton = document.getElementById('run'); - runButton.value = 'Ok'; - runButton.disabled = false; - runButton.classList.remove('disabled'); + if (runButton) { + runButton.value = 'Ok'; + runButton.disabled = false; + runButton.classList.remove('disabled'); + } const searchButton = document.getElementById('search'); searchButton.value = '🔎'; @@ -1359,14 +1366,17 @@ async function reloadAll(do_search) { } await drawAll(); } catch (e) { - showError(e.toString()); + showError(e.message); } enableButtons(); } document.getElementById('params').onsubmit = function(event) { - let do_search = document.activeElement === document.getElementById('search-query'); - reloadAll(do_search); + if (document.activeElement === document.getElementById('search-query')) { + reloadAll(true); + } else { + reloadAll(queries.length == 0); + } event.preventDefault(); } @@ -1405,13 +1415,15 @@ function refreshCustomized(value) { document.getElementById('search-span').style.opacity = customized ? 
0.5 : 1.0; } -function regenerate() { +function updateFromState() { document.getElementById('url').value = host; document.getElementById('user').value = user; document.getElementById('password').value = password; document.getElementById('search-query').value = search_query; refreshCustomized(); +} +function regenerate() { findParamsInQueries(); buildParams(); @@ -1430,7 +1442,7 @@ function regenerate() { window.onpopstate = function(event) { if (!event.state) { return; } ({host, user, queries, params, search_query, customized} = event.state); - + updateFromState(); regenerate(); drawAll(); }; @@ -1447,6 +1459,7 @@ if (window.location.hash) { async function start() { try { + updateFromState(); if (queries.length == 0) { await searchQueries(); } else { @@ -1460,7 +1473,7 @@ async function start() { drawAll(); } } catch (e) { - showError(e.toString()); + showError(e.message); } } diff --git a/programs/su/su.cpp b/programs/su/su.cpp index cebd05b3eb1..a8f61fb32b6 100644 --- a/programs/su/su.cpp +++ b/programs/su/su.cpp @@ -56,7 +56,7 @@ void setUserAndGroup(std::string arg_uid, std::string arg_gid) group * result{}; if (0 != getgrnam_r(arg_gid.data(), &entry, buf.get(), buf_size, &result)) - throwFromErrno(fmt::format("Cannot do 'getgrnam_r' to obtain gid from group name ({})", arg_gid), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot do 'getgrnam_r' to obtain gid from group name ({})", arg_gid); if (!result) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Group {} is not found in the system", arg_gid); @@ -68,7 +68,7 @@ void setUserAndGroup(std::string arg_uid, std::string arg_gid) throw Exception(ErrorCodes::BAD_ARGUMENTS, "Group has id 0, but dropping privileges to gid 0 does not make sense"); if (0 != setgid(gid)) - throwFromErrno(fmt::format("Cannot do 'setgid' to user ({})", arg_gid), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot do 'setgid' to user ({})", arg_gid); } if (!arg_uid.empty()) @@ -81,7 +81,7 @@ void setUserAndGroup(std::string arg_uid, std::string arg_gid) passwd * result{}; if (0 != getpwnam_r(arg_uid.data(), &entry, buf.get(), buf_size, &result)) - throwFromErrno(fmt::format("Cannot do 'getpwnam_r' to obtain uid from user name ({})", arg_uid), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot do 'getpwnam_r' to obtain uid from user name ({})", arg_uid); if (!result) throw Exception(ErrorCodes::BAD_ARGUMENTS, "User {} is not found in the system", arg_uid); @@ -93,7 +93,7 @@ void setUserAndGroup(std::string arg_uid, std::string arg_gid) throw Exception(ErrorCodes::BAD_ARGUMENTS, "User has id 0, but dropping privileges to uid 0 does not make sense"); if (0 != setuid(uid)) - throwFromErrno(fmt::format("Cannot do 'setuid' to user ({})", arg_uid), ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot do 'setuid' to user ({})", arg_uid); } } @@ -136,7 +136,7 @@ try execvp(new_argv.front(), new_argv.data()); - throwFromErrno("Cannot execvp", ErrorCodes::SYSTEM_ERROR); + throw ErrnoException(ErrorCodes::SYSTEM_ERROR, "Cannot execvp"); } catch (...) 
{ diff --git a/rust/BLAKE3/CMakeLists.txt b/rust/BLAKE3/CMakeLists.txt deleted file mode 100644 index ceb0a647b66..00000000000 --- a/rust/BLAKE3/CMakeLists.txt +++ /dev/null @@ -1,3 +0,0 @@ -clickhouse_import_crate(MANIFEST_PATH Cargo.toml) -target_include_directories(_ch_rust_blake3 INTERFACE include) -add_library(ch_rust::blake3 ALIAS _ch_rust_blake3) diff --git a/rust/BLAKE3/Cargo.toml b/rust/BLAKE3/Cargo.toml deleted file mode 100644 index ed414fa54c1..00000000000 --- a/rust/BLAKE3/Cargo.toml +++ /dev/null @@ -1,20 +0,0 @@ -[package] -name = "_ch_rust_blake3" -version = "0.1.0" - -# See more keys and their definitions at https://doc.rust-lang.org/cargo/reference/manifest.html - -[dependencies] -blake3 = "1.2.0" -libc = "0.2.132" - -[lib] -crate-type = ["staticlib"] - -[profile.release] -debug = true - -[profile.release-thinlto] -inherits = "release" -# BLAKE3 module requires "full" LTO (not "thin") to get additional 10% performance benefit -lto = true diff --git a/rust/BLAKE3/include/blake3.h b/rust/BLAKE3/include/blake3.h deleted file mode 100644 index 5dc7d5bd902..00000000000 --- a/rust/BLAKE3/include/blake3.h +++ /dev/null @@ -1,15 +0,0 @@ -#ifndef BLAKE3_H -#define BLAKE3_H - -#include - - -extern "C" { - -char *blake3_apply_shim(const char *begin, uint32_t _size, uint8_t *out_char_data); - -void blake3_free_char_pointer(char *ptr_to_free); - -} // extern "C" - -#endif /* BLAKE3_H */ diff --git a/rust/BLAKE3/src/lib.rs b/rust/BLAKE3/src/lib.rs deleted file mode 100644 index 011145d2f71..00000000000 --- a/rust/BLAKE3/src/lib.rs +++ /dev/null @@ -1,30 +0,0 @@ -extern crate blake3; -extern crate libc; - -use std::ffi::{CStr, CString}; -use std::os::raw::c_char; - -#[no_mangle] -pub unsafe extern "C" fn blake3_apply_shim( - begin: *const c_char, - _size: u32, - out_char_data: *mut u8, -) -> *mut c_char { - if begin.is_null() { - let err_str = CString::new("input was a null pointer").unwrap(); - return err_str.into_raw(); - } - let mut hasher = blake3::Hasher::new(); - let input_bytes = CStr::from_ptr(begin); - let input_res = input_bytes.to_bytes(); - hasher.update(input_res); - let mut reader = hasher.finalize_xof(); - reader.fill(std::slice::from_raw_parts_mut(out_char_data, blake3::OUT_LEN)); - std::ptr::null_mut() -} - -// Freeing memory according to docs: https://doc.rust-lang.org/std/ffi/struct.CString.html#method.into_raw -#[no_mangle] -pub unsafe extern "C" fn blake3_free_char_pointer(ptr_to_free: *mut c_char) { - std::mem::drop(CString::from_raw(ptr_to_free)); -} diff --git a/rust/CMakeLists.txt b/rust/CMakeLists.txt index 6aa25e95679..66694ee16f8 100644 --- a/rust/CMakeLists.txt +++ b/rust/CMakeLists.txt @@ -14,6 +14,10 @@ macro(configure_rustc) set(RUST_CFLAGS "${RUST_CFLAGS} --sysroot ${CMAKE_SYSROOT}") endif() + if (USE_MUSL) + set(RUST_CXXFLAGS "${RUST_CXXFLAGS} -D_LIBCPP_HAS_MUSL_LIBC=1") + endif () + if(CCACHE_EXECUTABLE MATCHES "/sccache$") message(STATUS "Using RUSTC_WRAPPER: ${CCACHE_EXECUTABLE}") set(RUSTCWRAPPER "rustc-wrapper = \"${CCACHE_EXECUTABLE}\"") @@ -95,6 +99,5 @@ function(add_rust_subdirectory src) VERBATIM) endfunction() -add_rust_subdirectory (BLAKE3) add_rust_subdirectory (skim) add_rust_subdirectory (prql) diff --git a/rust/Cargo.lock b/rust/Cargo.lock index 04569cd3b3a..86bbec5579f 100644 --- a/rust/Cargo.lock +++ b/rust/Cargo.lock @@ -2,14 +2,6 @@ # It is not intended for manual editing. 
version = 3 -[[package]] -name = "_ch_rust_blake3" -version = "0.1.0" -dependencies = [ - "blake3", - "libc", -] - [[package]] name = "_ch_rust_prql" version = "0.1.0" @@ -30,9 +22,9 @@ dependencies = [ [[package]] name = "addr2line" -version = "0.20.0" +version = "0.21.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f4fa78e18c64fce05e902adecd7a5eed15a5e0a3439f7b0e169f0252214865e3" +checksum = "8a30b2e23b9e17a9f90641c7ab1549cd9b44f296d3ccbf309d2863cfe398a0cb" dependencies = [ "gimli", ] @@ -45,24 +37,31 @@ checksum = "f26201604c87b1e01bd3d98f8d5d9a8fcbb815e8cedb41ffccbeb4bf593a35fe" [[package]] name = "ahash" -version = "0.7.6" +version = "0.8.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fcb51a0695d8f838b1ee009b3fbf66bda078cd64590202a864a8f3e8c4315c47" +checksum = "91429305e9f0a25f6205c5b8e0d2db09e0708a7a6df0f42212bb56c32c8ac97a" dependencies = [ - "getrandom", + "cfg-if", "once_cell", "version_check", + "zerocopy", ] [[package]] name = "aho-corasick" -version = "1.0.2" +version = "1.1.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "43f6cb1bf222025340178f382c426f13757b2960e89779dfcb319c32542a5a41" +checksum = "b2969dcb958b36655471fc61f7e416fa76033bdd4bfed0678d8fee1e2d07a1f0" dependencies = [ "memchr", ] +[[package]] +name = "allocator-api2" +version = "0.2.16" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "0942ffc6dcaadf03badf6e6a2d0228460359d5e34b57ccdc720b7382dfbd5ec5" + [[package]] name = "android-tzdata" version = "0.1.1" @@ -95,43 +94,43 @@ dependencies = [ [[package]] name = "anstyle" -version = "1.0.1" +version = "1.0.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3a30da5c5f2d5e72842e00bcb57657162cdabef0931f40e2deb9b4140440cecd" +checksum = "7079075b41f533b8c61d2a4d073c4676e1f8b249ff94a393b0595db304e0dd87" [[package]] name = "anstyle-parse" -version = "0.2.1" +version = "0.2.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "938874ff5980b03a87c5524b3ae5b59cf99b1d6bc836848df7bc5ada9643c333" +checksum = "c75ac65da39e5fe5ab759307499ddad880d724eed2f6ce5b5e8a26f4f387928c" dependencies = [ "utf8parse", ] [[package]] name = "anstyle-query" -version = "1.0.0" +version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5ca11d4be1bab0c8bc8734a9aa7bf4ee8316d462a08c6ac5052f888fef5b494b" +checksum = "e28923312444cdd728e4738b3f9c9cac739500909bb3d3c94b43551b16517648" dependencies = [ - "windows-sys", + "windows-sys 0.52.0", ] [[package]] name = "anstyle-wincon" -version = "1.0.1" +version = "1.0.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "180abfa45703aebe0093f79badacc01b8fd4ea2e35118747e5811127f926e188" +checksum = "c677ab05e09154296dd37acecd46420c17b9713e8366facafa8fc0885167cf4c" dependencies = [ "anstyle", - "windows-sys", + "windows-sys 0.48.0", ] [[package]] name = "anyhow" -version = "1.0.72" +version = "1.0.75" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3b13c32d80ecc7ab747b80c3784bce54ee8a7a0cc4fbda9bf4cda2cf6fe90854" +checksum = "a4668cab20f66d8d020e1fbc0ebe47217433c1b6c8f2040faf858554e394ace6" dependencies = [ "backtrace", ] @@ -146,12 +145,6 @@ dependencies = [ "yansi", ] -[[package]] -name = "arrayref" -version = "0.3.7" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6b4930d2cb77ce62f89ee5d5289b4ac049559b1c45539271f5ed4fdc7db34545" - [[package]] name = 
"arrayvec" version = "0.7.4" @@ -166,9 +159,9 @@ checksum = "d468802bab17cbc0cc575e9b053f41e72aa36bfa6b7f55e3529ffa43161b97fa" [[package]] name = "backtrace" -version = "0.3.68" +version = "0.3.69" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4319208da049c43661739c5fade2ba182f09d1dc2299b32298d3a31692b17e12" +checksum = "2089b7e3f35b9dd2d0ed921ead4f6d318c27680d4a5bd167b3ee120edb105837" dependencies = [ "addr2line", "cc", @@ -193,44 +186,24 @@ checksum = "bef38d45163c2f1dde094a7dfd33ccf595c92905c8f8f4fdc18d06fb1037718a" [[package]] name = "bitflags" -version = "2.3.3" +version = "2.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "630be753d4e58660abd17930c71b647fe46c27ea6b63cc59e1e3851406972e42" - -[[package]] -name = "blake3" -version = "1.4.1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "199c42ab6972d92c9f8995f086273d25c42fc0f7b2a1fcefba465c1352d25ba5" -dependencies = [ - "arrayref", - "arrayvec", - "cc", - "cfg-if", - "constant_time_eq", - "digest", -] - -[[package]] -name = "block-buffer" -version = "0.10.4" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3078c7629b62d3f0439517fa394996acacc5cbc91c5a20d8c658e77abd503a71" -dependencies = [ - "generic-array", -] +checksum = "327762f6e5a765692301e5bb513e0d9fef63be86bbc14528052b1cd3e6f03e07" [[package]] name = "bumpalo" -version = "3.13.0" +version = "3.14.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a3e2c3daef883ecc1b5d58c15adae93470a91d425f3532ba1695849656af3fc1" +checksum = "7f30e7476521f6f8af1a1c4c0b8cc94f0bee37d91763d0ca2665f299b6cd8aec" [[package]] name = "cc" -version = "1.0.79" +version = "1.0.83" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "50d30906286121d95be3d479533b458f87493b30a4b5f79a607db8f5d11aa91f" +checksum = "f1174fb0b6ec23863f8b971027804a42614e347eafb0a95bf0b12cdae21fc4d0" +dependencies = [ + "libc", +] [[package]] name = "cfg-if" @@ -240,24 +213,23 @@ checksum = "baf1de4339761588bc0619e3cbc0120ee582ebb74b53b4efbf79117bd2da40fd" [[package]] name = "chrono" -version = "0.4.26" +version = "0.4.31" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ec837a71355b28f6556dbd569b37b3f363091c0bd4b2e735674521b4c5fd9bc5" +checksum = "7f2c685bad3eb3d45a01354cedb7d5faa66194d1d58ba6e267a8de788f79db38" dependencies = [ "android-tzdata", "iana-time-zone", "js-sys", "num-traits", - "time 0.1.45", "wasm-bindgen", - "winapi", + "windows-targets 0.48.5", ] [[package]] name = "chumsky" -version = "0.9.2" +version = "0.9.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "23170228b96236b5a7299057ac284a321457700bc8c41a4476052f0f4ba5349d" +checksum = "8eebd66744a15ded14960ab4ccdbfb51ad3b81f51f3f04a80adac98c985396c9" dependencies = [ "hashbrown", "stacker", @@ -279,17 +251,11 @@ version = "1.0.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "acbf1af155f9b9ef647e42cdc158db4b64a1b61f743629225fde6f3e0be2a7c7" -[[package]] -name = "constant_time_eq" -version = "0.3.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f7144d30dcf0fafbce74250a3963025d8d52177934239851c917d29f1df280c2" - [[package]] name = "core-foundation-sys" -version = "0.8.4" +version = "0.8.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e496a50fda8aacccc86d7529e2c1e0892dbd0f898a6b5645b5561b89c3210efa" +checksum = 
"06ea2b9bc92be3c2baa9334a323ebca2d6f074ff852cd1d7b11064035cd3868f" [[package]] name = "crossbeam" @@ -307,9 +273,9 @@ dependencies = [ [[package]] name = "crossbeam-channel" -version = "0.5.8" +version = "0.5.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "a33c2bf77f2df06183c3aa30d1e96c0695a313d4f9c453cc3762a6db39f99200" +checksum = "14c3242926edf34aec4ac3a77108ad4854bffaa2e4ddc1824124ce59231302d5" dependencies = [ "cfg-if", "crossbeam-utils", @@ -317,9 +283,9 @@ dependencies = [ [[package]] name = "crossbeam-deque" -version = "0.8.3" +version = "0.8.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ce6fd6f855243022dcecf8702fef0c297d4338e226845fe067f6341ad9fa0cef" +checksum = "fca89a0e215bab21874660c67903c5f143333cab1da83d041c7ded6053774751" dependencies = [ "cfg-if", "crossbeam-epoch", @@ -328,22 +294,21 @@ dependencies = [ [[package]] name = "crossbeam-epoch" -version = "0.9.15" +version = "0.9.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ae211234986c545741a7dc064309f67ee1e5ad243d0e48335adc0484d960bcc7" +checksum = "2d2fe95351b870527a5d09bf563ed3c97c0cffb87cf1c78a591bf48bb218d9aa" dependencies = [ "autocfg", "cfg-if", "crossbeam-utils", "memoffset 0.9.0", - "scopeguard", ] [[package]] name = "crossbeam-queue" -version = "0.3.8" +version = "0.3.9" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d1cfb3ea8a53f37c40dea2c7bedcbd88bdfae54f5e2175d6ecaff1c988353add" +checksum = "b9bcf5bdbfdd6030fb4a1c497b5d5fc5921aa2f60d359a17e249c0e6df3de153" dependencies = [ "cfg-if", "crossbeam-utils", @@ -351,28 +316,18 @@ dependencies = [ [[package]] name = "crossbeam-utils" -version = "0.8.16" +version = "0.8.17" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5a22b2d63d4d1dc0b7f1b6b2747dd0088008a9be28b6ddf0b1e7d335e3037294" +checksum = "c06d96137f14f244c37f989d9fff8f95e6c18b918e71f36638f8c49112e4c78f" dependencies = [ "cfg-if", ] -[[package]] -name = "crypto-common" -version = "0.1.6" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1bfb12502f3fc46cca1bb51ac28df9d618d813cdc3d2f25b9fe775a34af26bb3" -dependencies = [ - "generic-array", - "typenum", -] - [[package]] name = "csv" -version = "1.2.2" +version = "1.3.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "626ae34994d3d8d668f4269922248239db4ae42d538b14c398b74a52208e8086" +checksum = "ac574ff4d437a7b5ad237ef331c17ccca63c46479e5b5453eb8e10bb99a759fe" dependencies = [ "csv-core", "itoa", @@ -382,18 +337,18 @@ dependencies = [ [[package]] name = "csv-core" -version = "0.1.10" +version = "0.1.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2b2466559f260f48ad25fe6317b3c8dac77b5bdb5763ac7d9d6103530663bc90" +checksum = "5efa2b3d7902f4b634a20cae3c9c4e6209dc4779feb6863329607560143efa70" dependencies = [ "memchr", ] [[package]] name = "cxx" -version = "1.0.102" +version = "1.0.111" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f68e12e817cb19eaab81aaec582b4052d07debd3c3c6b083b9d361db47c7dc9d" +checksum = "e9fc0c733f71e58dedf4f034cd2a266f80b94cc9ed512729e1798651b68c2cba" dependencies = [ "cc", "cxxbridge-flags", @@ -403,9 +358,9 @@ dependencies = [ [[package]] name = "cxx-build" -version = "1.0.102" +version = "1.0.111" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e789217e4ab7cf8cc9ce82253180a9fe331f35f5d339f0ccfe0270b39433f397" +checksum = 
"51bc81d2664db24cf1d35405f66e18a85cffd4d49ab930c71a5c6342a410f38c" dependencies = [ "cc", "codespan-reporting", @@ -413,24 +368,24 @@ dependencies = [ "proc-macro2", "quote", "scratch", - "syn 2.0.27", + "syn 2.0.41", ] [[package]] name = "cxxbridge-flags" -version = "1.0.102" +version = "1.0.111" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "78a19f4c80fd9ab6c882286fa865e92e07688f4387370a209508014ead8751d0" +checksum = "8511afbe34ea242697784da5cb2c5d4a0afb224ca8b136bdf93bfe180cbe5884" [[package]] name = "cxxbridge-macro" -version = "1.0.102" +version = "1.0.111" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b8fcfa71f66c8563c4fa9dd2bb68368d50267856f831ac5d85367e0805f9606c" +checksum = "5c6888cd161769d65134846d4d4981d5a6654307cc46ec83fb917e530aea5f84" dependencies = [ "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", ] [[package]] @@ -478,6 +433,15 @@ dependencies = [ "once_cell", ] +[[package]] +name = "deranged" +version = "0.3.10" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8eb30d70a07a3b04884d2677f06bec33509dc67ca60d92949e5535352d3191dc" +dependencies = [ + "powerfmt", +] + [[package]] name = "derive_builder" version = "0.11.2" @@ -509,17 +473,6 @@ dependencies = [ "syn 1.0.109", ] -[[package]] -name = "digest" -version = "0.10.7" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "9ed9a281f7bc9b7576e61468ba615a66a5c8cfdff42420a70aa82701a3b1e292" -dependencies = [ - "block-buffer", - "crypto-common", - "subtle", -] - [[package]] name = "dirs-next" version = "2.0.0" @@ -556,28 +509,17 @@ dependencies = [ "heck", "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", ] [[package]] name = "errno" -version = "0.3.2" +version = "0.3.8" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6b30f669a7961ef1631673d2766cc92f52d64f7ef354d4fe0ddfd30ed52f0f4f" +checksum = "a258e46cdc063eb8519c00b9fc845fc47bcfca4130e2f08e88665ceda8474245" dependencies = [ - "errno-dragonfly", - "libc", - "windows-sys", -] - -[[package]] -name = "errno-dragonfly" -version = "0.1.2" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "aa68f1b12764fab894d2755d2518754e71b4fd80ecfb822714a1206c2aab39bf" -dependencies = [ - "cc", "libc", + "windows-sys 0.52.0", ] [[package]] @@ -595,40 +537,31 @@ dependencies = [ "thread_local", ] -[[package]] -name = "generic-array" -version = "0.14.7" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "85649ca51fd72272d7821adaf274ad91c288277713d9c18820d8499a7ff69e9a" -dependencies = [ - "typenum", - "version_check", -] - [[package]] name = "getrandom" -version = "0.2.10" +version = "0.2.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "be4136b2a15dd319360be1c07d9933517ccf0be8f16bf62a3bee4f0d618df427" +checksum = "fe9006bed769170c11f845cf00c7c1e9092aeb3f268e007c3e760ac68008070f" dependencies = [ "cfg-if", "libc", - "wasi 0.11.0+wasi-snapshot-preview1", + "wasi", ] [[package]] name = "gimli" -version = "0.27.3" +version = "0.28.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b6c80984affa11d98d1b88b66ac8853f143217b399d3c74116778ff8fdb4ed2e" +checksum = "4271d37baee1b8c7e4b708028c57d816cf9d2434acb33a549475f78c181f6253" [[package]] name = "hashbrown" -version = "0.12.3" +version = "0.14.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"8a9ee70c43aaf417c914396645a0fa852624801b24ebb7ae78fe8272889ac888" +checksum = "290f1a1d9242c78d09ce40a5e87e7554ee637af1351968159f4952f028f75604" dependencies = [ "ahash", + "allocator-api2", ] [[package]] @@ -639,22 +572,22 @@ checksum = "95505c38b4572b2d910cecb0281560f54b440a19336cbbcb27bf6ce6adc6f5a8" [[package]] name = "hermit-abi" -version = "0.3.2" +version = "0.3.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "443144c8cdadd93ebf52ddb4056d257f5b52c04d3c804e657d19eb73fc33668b" +checksum = "d77f7ec81a6d05a3abb01ab6eb7590f6083d08449fe5a1c8b1e620283546ccb7" [[package]] name = "iana-time-zone" -version = "0.1.57" +version = "0.1.58" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2fad5b825842d2b38bd206f3e81d6957625fd7f0a361e345c30e01a0ae2dd613" +checksum = "8326b86b6cff230b97d0d312a6c40a60726df3332e721f72a1b035f451663b20" dependencies = [ "android_system_properties", "core-foundation-sys", "iana-time-zone-haiku", "js-sys", "wasm-bindgen", - "windows", + "windows-core", ] [[package]] @@ -680,16 +613,7 @@ checksum = "cb0889898416213fab133e1d33a0e5858a48177452750691bde3666d0fdbaf8b" dependencies = [ "hermit-abi", "rustix", - "windows-sys", -] - -[[package]] -name = "itertools" -version = "0.10.5" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b0fd2260e829bddf4cb6ea802289de2f86d6a7a690192fbe91b3f46e0f2c8473" -dependencies = [ - "either", + "windows-sys 0.48.0", ] [[package]] @@ -702,16 +626,25 @@ dependencies = [ ] [[package]] -name = "itoa" -version = "1.0.9" +name = "itertools" +version = "0.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "af150ab688ff2122fcef229be89cb50dd66af9e01a4ff320cc137eecc9bacc38" +checksum = "25db6b064527c5d482d0423354fcd07a89a2dfe07b67892e62411946db7f07b0" +dependencies = [ + "either", +] + +[[package]] +name = "itoa" +version = "1.0.10" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b1a46d1a171d865aa5f83f92695765caa047a9b4cbae2cbf37dbd613a793fd4c" [[package]] name = "js-sys" -version = "0.3.64" +version = "0.3.66" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c5f195fe497f702db0f318b07fdd68edb16955aed830df8363d837542f8f935a" +checksum = "cee9c64da59eae3b50095c18d3e74f8b73c0b86d2792824ff01bbce68ba229ca" dependencies = [ "wasm-bindgen", ] @@ -724,9 +657,20 @@ checksum = "e2abad23fbc42b3700f2f279844dc832adb2b2eb069b2df918f455c4e18cc646" [[package]] name = "libc" -version = "0.2.147" +version = "0.2.151" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b4668fb0ea861c1df094127ac5f1da3409a82116a4ba74fca2e58ef927159bb3" +checksum = "302d7ab3130588088d277783b1e2d2e10c9e9e4a16dd9050e6ec93fb3e7048f4" + +[[package]] +name = "libredox" +version = "0.0.1" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "85c833ca1e66078851dba29046874e38f08b2c883700aa29a03ddd3b23814ee8" +dependencies = [ + "bitflags 2.4.1", + "libc", + "redox_syscall", +] [[package]] name = "link-cplusplus" @@ -739,21 +683,21 @@ dependencies = [ [[package]] name = "linux-raw-sys" -version = "0.4.5" +version = "0.4.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "57bcfdad1b858c2db7c38303a6d2ad4dfaf5eb53dfeb0910128b2c26d6158503" +checksum = "c4cd1a83af159aa67994778be9070f0ae1bd732942279cabb14f86f986a21456" [[package]] name = "log" -version = "0.4.19" +version = "0.4.20" source = "registry+https://github.com/rust-lang/crates.io-index" 
-checksum = "b06a4cde4c0f271a446782e3eff8de789548ce57dbc8eca9292c27f4a42004b4" +checksum = "b5e6163cb8c49088c2c36f57875e58ccd8c87c7427f7fbd50ea6710b2f3f2e8f" [[package]] name = "memchr" -version = "2.5.0" +version = "2.6.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2dffe52ecf27772e601905b7522cb4ef790d2cc203488bbd0e2fe85fcb74566d" +checksum = "f665ee40bc4a3c5590afb1e9677db74a508659dfd71e126420da8274909a0167" [[package]] name = "memoffset" @@ -825,37 +769,27 @@ dependencies = [ [[package]] name = "num-traits" -version = "0.2.16" +version = "0.2.17" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "f30b0abd723be7e2ffca1272140fac1a2f084c77ec3e123c192b66af1ee9e6c2" +checksum = "39e3200413f237f41ab11ad6d161bc7239c84dcb631773ccd7de3dfe4b5c267c" dependencies = [ "autocfg", ] -[[package]] -name = "num_cpus" -version = "1.16.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4161fcb6d602d4d2081af7c3a45852d875a03dd337a6bfdd6e06407b61342a43" -dependencies = [ - "hermit-abi", - "libc", -] - [[package]] name = "object" -version = "0.31.1" +version = "0.32.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "8bda667d9f2b5051b8833f59f3bf748b28ef54f850f4fcb389a252aa383866d1" +checksum = "9cf5f9dd3933bd50a9e1f149ec995f39ae2c496d31fd772c1fd45ebc27e902b0" dependencies = [ "memchr", ] [[package]] name = "once_cell" -version = "1.18.0" +version = "1.19.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dd8b5dd2ae5ed71462c540258bedcb51965123ad7e7ccf4b9a8cafaa4a63576d" +checksum = "3fdb12b2476b595f9358c5161aa467c2438859caa136dec86c26fdd2efe17b92" [[package]] name = "pin-utils" @@ -864,19 +798,25 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "8b870d8c151b6f2fb93e84a13146138f05d02ed11c7e7c54f8826aaaf7c9f184" [[package]] -name = "proc-macro2" -version = "1.0.66" +name = "powerfmt" +version = "0.2.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "18fb31db3f9bddb2ea821cde30a9f70117e3f119938b5ee630b7403aa6e2ead9" +checksum = "439ee305def115ba05938db6eb1644ff94165c5ab5e9420d1c1bcedbba909391" + +[[package]] +name = "proc-macro2" +version = "1.0.70" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "39278fbbf5fb4f646ce651690877f89d1c5811a3d4acb27700c1cb3cdb78fd3b" dependencies = [ "unicode-ident", ] [[package]] name = "prql-ast" -version = "0.9.3" +version = "0.9.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "71194e75f14dbe7debdf2b5eca0812c978021a1bd23d6fe1da98b58e407e035a" +checksum = "d9d91522f9f16d055409b9ffec55693a96e3424fe5d8e7c8331adcf6d7ee363a" dependencies = [ "enum-as-inner", "semver", @@ -886,9 +826,9 @@ dependencies = [ [[package]] name = "prql-compiler" -version = "0.9.3" +version = "0.9.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5ff28e838b1be4227cc567a75c11caa3be25c5015f0e5fd21279c06e944ba44f" +checksum = "f4d56865532fcf1abaa31fbb6da6fd9e90edc441c5c78bfe2870ee75187c7a3c" dependencies = [ "anstream", "anyhow", @@ -912,9 +852,9 @@ dependencies = [ [[package]] name = "prql-parser" -version = "0.9.3" +version = "0.9.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3182e2ef0465a960eb02519b18768e39123d3c3a0037a2d2934055a3ef901870" +checksum = "9360352e413390cfd26345f49279622b87581a3b748340d3f42d4d616c2a1ec1" dependencies = [ "chumsky", "itertools 0.11.0", @@ -933,18 
+873,18 @@ dependencies = [ [[package]] name = "quote" -version = "1.0.31" +version = "1.0.33" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5fe8a65d69dd0808184ebb5f836ab526bb259db23c657efa38711b1072ee47f0" +checksum = "5267fca4496028628a95160fc423a33e8b2e6af8a5302579e322e4b520293cae" dependencies = [ "proc-macro2", ] [[package]] name = "rayon" -version = "1.7.0" +version = "1.8.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1d2df5196e37bcc87abebc0053e20787d73847bb33134a69841207dd0a47f03b" +checksum = "9c27db03db7734835b3f53954b534c91069375ce6ccaa2e065441e07d9b6cdb1" dependencies = [ "either", "rayon-core", @@ -952,41 +892,39 @@ dependencies = [ [[package]] name = "rayon-core" -version = "1.11.0" +version = "1.12.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4b8f95bd6966f5c87776639160a66bd8ab9895d9d4ab01ddba9fc60661aebe8d" +checksum = "5ce3fb6ad83f861aac485e76e1985cd109d9a3713802152be56c3b1f0e0658ed" dependencies = [ - "crossbeam-channel", "crossbeam-deque", "crossbeam-utils", - "num_cpus", ] [[package]] name = "redox_syscall" -version = "0.2.16" +version = "0.4.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "fb5a58c1855b4b6819d59012155603f0b22ad30cad752600aadfcb695265519a" +checksum = "4722d768eff46b75989dd134e5c353f0d6296e5aaa3132e776cbdb56be7731aa" dependencies = [ "bitflags 1.3.2", ] [[package]] name = "redox_users" -version = "0.4.3" +version = "0.4.4" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b033d837a7cf162d7993aded9304e30a83213c648b6e389db233191f891e5c2b" +checksum = "a18479200779601e498ada4e8c1e1f50e3ee19deb0259c25825a98b5603b2cb4" dependencies = [ "getrandom", - "redox_syscall", + "libredox", "thiserror", ] [[package]] name = "regex" -version = "1.9.1" +version = "1.10.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b2eae68fc220f7cf2532e4494aded17545fce192d59cd996e0fe7887f4ceb575" +checksum = "380b951a9c5e80ddfd6136919eef32310721aa4aacd4889a8d39124b026ab343" dependencies = [ "aho-corasick", "memchr", @@ -996,9 +934,9 @@ dependencies = [ [[package]] name = "regex-automata" -version = "0.3.3" +version = "0.4.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "39354c10dd07468c2e73926b23bb9c2caca74c5501e38a35da70406f1d923310" +checksum = "5f804c7828047e88b2d32e2d7fe5a105da8ee3264f01902f796c8e067dc2483f" dependencies = [ "aho-corasick", "memchr", @@ -1007,9 +945,9 @@ dependencies = [ [[package]] name = "regex-syntax" -version = "0.7.4" +version = "0.8.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e5ea92a5b6195c6ef2a0295ea818b312502c6fc94dde986c5553242e18fd4ce2" +checksum = "c08c74e62047bb2de4ff487b251e4a92e24f48745648451635cec7d591162d9f" [[package]] name = "rustc-demangle" @@ -1019,15 +957,15 @@ checksum = "d626bb9dae77e28219937af045c257c28bfd3f69333c512553507f5f9798cb76" [[package]] name = "rustix" -version = "0.38.6" +version = "0.38.28" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1ee020b1716f0a80e2ace9b03441a749e402e86712f15f16fe8a8f75afac732f" +checksum = "72e572a5e8ca657d7366229cdde4bd14c4eb5499a9573d4d366fe1b599daa316" dependencies = [ - "bitflags 2.3.3", + "bitflags 2.4.1", "errno", "libc", "linux-raw-sys", - "windows-sys", + "windows-sys 0.52.0", ] [[package]] @@ -1038,15 +976,9 @@ checksum = "7ffc183a10b4478d04cbbbfc96d0873219d962dd5accaff2ffbd4ceb7df837f4" [[package]] name = 
"ryu" -version = "1.0.15" +version = "1.0.16" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1ad4cc8da4ef723ed60bced201181d83791ad433213d8c24efffda1eec85d741" - -[[package]] -name = "scopeguard" -version = "1.2.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "94143f37725109f92c262ed2cf5e59bce7498c01bcc1502d7b9afe439a4e9f49" +checksum = "f98d2aa92eebf49b69786be48e4477826b256916e84a57ff2a4f21923b48eb4c" [[package]] name = "scratch" @@ -1056,38 +988,38 @@ checksum = "a3cf7c11c38cb994f3d40e8a8cde3bbd1f72a435e4c49e85d6553d8312306152" [[package]] name = "semver" -version = "1.0.18" +version = "1.0.20" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b0293b4b29daaf487284529cc2f5675b8e57c61f70167ba415a463651fd6a918" +checksum = "836fa6a3e1e547f9a2c4040802ec865b5d85f4014efe00555d7090a3dcaa1090" dependencies = [ "serde", ] [[package]] name = "serde" -version = "1.0.174" +version = "1.0.193" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "3b88756493a5bd5e5395d53baa70b194b05764ab85b59e43e4b8f4e1192fa9b1" +checksum = "25dd9975e68d0cb5aa1120c288333fc98731bd1dd12f561e468ea4728c042b89" dependencies = [ "serde_derive", ] [[package]] name = "serde_derive" -version = "1.0.174" +version = "1.0.193" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6e5c3a298c7f978e53536f95a63bdc4c4a64550582f31a0359a9afda6aede62e" +checksum = "43576ca501357b9b071ac53cdc7da8ef0cbd9493d8df094cd821777ea6e894d3" dependencies = [ "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", ] [[package]] name = "serde_json" -version = "1.0.103" +version = "1.0.108" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "d03b412469450d4404fe8499a268edd7f8b79fecb074b0d812ad64ca21f4031b" +checksum = "3d1c7e3eac408d115102c4c24ad393e0821bb3a5df4d506a80f85f7a742a526b" dependencies = [ "itoa", "ryu", @@ -1112,7 +1044,7 @@ dependencies = [ "nix 0.25.1", "rayon", "regex", - "time 0.3.23", + "time", "timer", "tuikit", "unicode-width", @@ -1121,20 +1053,20 @@ dependencies = [ [[package]] name = "sqlformat" -version = "0.2.1" +version = "0.2.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "0c12bc9199d1db8234678b7051747c07f517cdcf019262d1847b94ec8b1aee3e" +checksum = "ce81b7bd7c4493975347ef60d8c7e8b742d4694f4c49f93e0a12ea263938176c" dependencies = [ - "itertools 0.10.5", + "itertools 0.12.0", "nom", "unicode_categories", ] [[package]] name = "sqlparser" -version = "0.36.1" +version = "0.37.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "2eaa1e88e78d2c2460d78b7dc3f0c08dbb606ab4222f9aff36f420d36e307d87" +checksum = "37ae05a8250b968a3f7db93155a84d68b2e6cea1583949af5ca5b5170c76c075" dependencies = [ "log", "serde", @@ -1170,23 +1102,17 @@ dependencies = [ [[package]] name = "strum_macros" -version = "0.25.1" +version = "0.25.3" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "6069ca09d878a33f883cc06aaa9718ede171841d3832450354410b718b097232" +checksum = "23dc1fa9ac9c169a78ba62f0b841814b7abae11bdd047b9c58f893439e309ea0" dependencies = [ "heck", "proc-macro2", "quote", "rustversion", - "syn 2.0.27", + "syn 2.0.41", ] -[[package]] -name = "subtle" -version = "2.5.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "81cdd64d312baedb58e21336b31bc043b77e01cc99033ce76ef539f78e965ebc" - [[package]] name = "syn" version = "1.0.109" @@ -1200,9 +1126,9 @@ dependencies = [ 
[[package]] name = "syn" -version = "2.0.27" +version = "2.0.41" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b60f673f44a8255b9c8c657daf66a596d435f2da81a555b06dc644d080ba45e0" +checksum = "44c8b28c477cc3bf0e7966561e3460130e1255f7a1cf71931075f1c5e7a7e269" dependencies = [ "proc-macro2", "quote", @@ -1222,31 +1148,31 @@ dependencies = [ [[package]] name = "termcolor" -version = "1.2.0" +version = "1.4.0" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "be55cf8942feac5c765c2c993422806843c9a9a45d4d5c407ad6dd2ea95eb9b6" +checksum = "ff1bc3d3f05aff0403e8ac0d92ced918ec05b666a43f83297ccef5bea8a3d449" dependencies = [ "winapi-util", ] [[package]] name = "thiserror" -version = "1.0.44" +version = "1.0.51" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "611040a08a0439f8248d1990b111c95baa9c704c805fa1f62104b39655fd7f90" +checksum = "f11c217e1416d6f036b870f14e0413d480dbf28edbee1f877abaf0206af43bb7" dependencies = [ "thiserror-impl", ] [[package]] name = "thiserror-impl" -version = "1.0.44" +version = "1.0.51" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "090198534930841fab3a5d1bb637cde49e339654e606195f8d9c76eeb081dc96" +checksum = "01742297787513b79cf8e29d1056ede1313e2420b7b3b15d0a768b4921f549df" dependencies = [ "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", ] [[package]] @@ -1261,30 +1187,21 @@ dependencies = [ [[package]] name = "time" -version = "0.1.45" +version = "0.3.30" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1b797afad3f312d1c66a56d11d0316f916356d11bd158fbc6ca6389ff6bf805a" -dependencies = [ - "libc", - "wasi 0.10.0+wasi-snapshot-preview1", - "winapi", -] - -[[package]] -name = "time" -version = "0.3.23" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "59e399c068f43a5d116fedaf73b203fa4f9c519f17e2b34f63221d3792f81446" +checksum = "c4a34ab300f2dee6e562c10a046fc05e358b29f9bf92277f30c3c8d82275f6f5" dependencies = [ + "deranged", + "powerfmt", "serde", "time-core", ] [[package]] name = "time-core" -version = "0.1.1" +version = "0.1.2" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7300fbefb4dadc1af235a9cef3737cea692a9d97e1b9cbcd4ebdae6f8868e6fb" +checksum = "ef927ca75afb808a4d64dd374f00a2adf8d0fcff8e7b184af886c3c87ec4a3f3" [[package]] name = "timer" @@ -1309,23 +1226,17 @@ dependencies = [ "unicode-width", ] -[[package]] -name = "typenum" -version = "1.16.0" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "497961ef93d974e23eb6f433eb5fe1b7930b659f06d12dec6fc44a8f554c0bba" - [[package]] name = "unicode-ident" -version = "1.0.11" +version = "1.0.12" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "301abaae475aa91687eb82514b328ab47a211a533026cb25fc3e519b86adfc3c" +checksum = "3354b9ac3fae1ff6755cb6db53683adb661634f67557942dea4facebec0fee4b" [[package]] name = "unicode-width" -version = "0.1.10" +version = "0.1.11" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "c0edd1e5b14653f783770bce4a4dabb4a5108a5370a5f5d8cfe8710c361f6c8b" +checksum = "e51733f11c9c4f72aa0c160008246859e340b00807569a0da0e7a1079b27ba85" [[package]] name = "unicode_categories" @@ -1366,12 +1277,6 @@ dependencies = [ "quote", ] -[[package]] -name = "wasi" -version = "0.10.0+wasi-snapshot-preview1" -source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = 
"1a143597ca7c7793eff794def352d41792a93c481eb1042423ff7ff72ba2c31f" - [[package]] name = "wasi" version = "0.11.0+wasi-snapshot-preview1" @@ -1380,9 +1285,9 @@ checksum = "9c8d87e72b64a3b4db28d11ce29237c246188f4f51057d65a7eab63b7987e423" [[package]] name = "wasm-bindgen" -version = "0.2.87" +version = "0.2.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7706a72ab36d8cb1f80ffbf0e071533974a60d0a308d01a5d0375bf60499a342" +checksum = "0ed0d4f68a3015cc185aff4db9506a015f4b96f95303897bfa23f846db54064e" dependencies = [ "cfg-if", "wasm-bindgen-macro", @@ -1390,24 +1295,24 @@ dependencies = [ [[package]] name = "wasm-bindgen-backend" -version = "0.2.87" +version = "0.2.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "5ef2b6d3c510e9625e5fe6f509ab07d66a760f0885d858736483c32ed7809abd" +checksum = "1b56f625e64f3a1084ded111c4d5f477df9f8c92df113852fa5a374dbda78826" dependencies = [ "bumpalo", "log", "once_cell", "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", "wasm-bindgen-shared", ] [[package]] name = "wasm-bindgen-macro" -version = "0.2.87" +version = "0.2.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "dee495e55982a3bd48105a7b947fd2a9b4a8ae3010041b9e0faab3f9cd028f1d" +checksum = "0162dbf37223cd2afce98f3d0785506dcb8d266223983e4b5b525859e6e182b2" dependencies = [ "quote", "wasm-bindgen-macro-support", @@ -1415,22 +1320,22 @@ dependencies = [ [[package]] name = "wasm-bindgen-macro-support" -version = "0.2.87" +version = "0.2.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "54681b18a46765f095758388f2d0cf16eb8d4169b639ab575a8f5693af210c7b" +checksum = "f0eb82fcb7930ae6219a7ecfd55b217f5f0893484b7a13022ebb2b2bf20b5283" dependencies = [ "proc-macro2", "quote", - "syn 2.0.27", + "syn 2.0.41", "wasm-bindgen-backend", "wasm-bindgen-shared", ] [[package]] name = "wasm-bindgen-shared" -version = "0.2.87" +version = "0.2.89" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "ca6ad05a4870b2bf5fe995117d3728437bd27d7cd5f06f13c17443ef369775a1" +checksum = "7ab9b36309365056cd639da3134bf87fa8f3d86008abf99e612384a6eecd459f" [[package]] name = "winapi" @@ -1450,9 +1355,9 @@ checksum = "ac3b87c63620426dd9b991e5ce0329eff545bccbbb34f3be09ff6fb6ab51b7b6" [[package]] name = "winapi-util" -version = "0.1.5" +version = "0.1.6" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "70ec6ce85bb158151cae5e5c87f95a8e97d2c0c4b001223f33a334e3ce5de178" +checksum = "f29e6f9198ba0d26b4c9f07dbe6f9ed633e1f3d5b8b414090084349e46a52596" dependencies = [ "winapi", ] @@ -1464,12 +1369,12 @@ source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "712e227841d057c1ee1cd2fb22fa7e5a5461ae8e48fa2ca79ec42cfc1931183f" [[package]] -name = "windows" -version = "0.48.0" +name = "windows-core" +version = "0.51.1" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "e686886bc078bc1b0b600cac0147aadb815089b6e4da64016cbd754b6342700f" +checksum = "f1f8cf84f35d2db49a46868f947758c7a1138116f7fac3bc844f43ade1292e64" dependencies = [ - "windows-targets", + "windows-targets 0.48.5", ] [[package]] @@ -1478,68 +1383,154 @@ version = "0.48.0" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "677d2418bec65e3338edb076e806bc1ec15693c5d0104683f2efe857f61056a9" dependencies = [ - "windows-targets", + "windows-targets 0.48.5", +] + +[[package]] +name = "windows-sys" +version = "0.52.0" +source = 
"registry+https://github.com/rust-lang/crates.io-index" +checksum = "282be5f36a8ce781fad8c8ae18fa3f9beff57ec1b52cb3de0789201425d9a33d" +dependencies = [ + "windows-targets 0.52.0", ] [[package]] name = "windows-targets" -version = "0.48.1" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "05d4b17490f70499f20b9e791dcf6a299785ce8af4d709018206dc5b4953e95f" +checksum = "9a2fa6e2155d7247be68c096456083145c183cbbbc2764150dda45a87197940c" dependencies = [ - "windows_aarch64_gnullvm", - "windows_aarch64_msvc", - "windows_i686_gnu", - "windows_i686_msvc", - "windows_x86_64_gnu", - "windows_x86_64_gnullvm", - "windows_x86_64_msvc", + "windows_aarch64_gnullvm 0.48.5", + "windows_aarch64_msvc 0.48.5", + "windows_i686_gnu 0.48.5", + "windows_i686_msvc 0.48.5", + "windows_x86_64_gnu 0.48.5", + "windows_x86_64_gnullvm 0.48.5", + "windows_x86_64_msvc 0.48.5", +] + +[[package]] +name = "windows-targets" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "8a18201040b24831fbb9e4eb208f8892e1f50a37feb53cc7ff887feb8f50e7cd" +dependencies = [ + "windows_aarch64_gnullvm 0.52.0", + "windows_aarch64_msvc 0.52.0", + "windows_i686_gnu 0.52.0", + "windows_i686_msvc 0.52.0", + "windows_x86_64_gnu 0.52.0", + "windows_x86_64_gnullvm 0.52.0", + "windows_x86_64_msvc 0.52.0", ] [[package]] name = "windows_aarch64_gnullvm" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "91ae572e1b79dba883e0d315474df7305d12f569b400fcf90581b06062f7e1bc" +checksum = "2b38e32f0abccf9987a4e3079dfb67dcd799fb61361e53e2882c3cbaf0d905d8" + +[[package]] +name = "windows_aarch64_gnullvm" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "cb7764e35d4db8a7921e09562a0304bf2f93e0a51bfccee0bd0bb0b666b015ea" [[package]] name = "windows_aarch64_msvc" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "b2ef27e0d7bdfcfc7b868b317c1d32c641a6fe4629c171b8928c7b08d98d7cf3" +checksum = "dc35310971f3b2dbbf3f0690a219f40e2d9afcf64f9ab7cc1be722937c26b4bc" + +[[package]] +name = "windows_aarch64_msvc" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "bbaa0368d4f1d2aaefc55b6fcfee13f41544ddf36801e793edbbfd7d7df075ef" [[package]] name = "windows_i686_gnu" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "622a1962a7db830d6fd0a69683c80a18fda201879f0f447f065a3b7467daa241" +checksum = "a75915e7def60c94dcef72200b9a8e58e5091744960da64ec734a6c6e9b3743e" + +[[package]] +name = "windows_i686_gnu" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "a28637cb1fa3560a16915793afb20081aba2c92ee8af57b4d5f28e4b3e7df313" [[package]] name = "windows_i686_msvc" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "4542c6e364ce21bf45d69fdd2a8e455fa38d316158cfd43b3ac1c5b1b19f8e00" +checksum = "8f55c233f70c4b27f66c523580f78f1004e8b5a8b659e05a4eb49d4166cca406" + +[[package]] +name = "windows_i686_msvc" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "ffe5e8e31046ce6230cc7215707b816e339ff4d4d67c65dffa206fd0f7aa7b9a" [[package]] name = "windows_x86_64_gnu" -version = "0.48.0" +version = "0.48.5" source = 
"registry+https://github.com/rust-lang/crates.io-index" -checksum = "ca2b8a661f7628cbd23440e50b05d705db3686f894fc9580820623656af974b1" +checksum = "53d40abd2583d23e4718fddf1ebec84dbff8381c07cae67ff7768bbf19c6718e" + +[[package]] +name = "windows_x86_64_gnu" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "3d6fa32db2bc4a2f5abeacf2b69f7992cd09dca97498da74a151a3132c26befd" [[package]] name = "windows_x86_64_gnullvm" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "7896dbc1f41e08872e9d5e8f8baa8fdd2677f29468c4e156210174edc7f7b953" +checksum = "0b7b52767868a23d5bab768e390dc5f5c55825b6d30b86c844ff2dc7414044cc" + +[[package]] +name = "windows_x86_64_gnullvm" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1a657e1e9d3f514745a572a6846d3c7aa7dbe1658c056ed9c3344c4109a6949e" [[package]] name = "windows_x86_64_msvc" -version = "0.48.0" +version = "0.48.5" source = "registry+https://github.com/rust-lang/crates.io-index" -checksum = "1a515f5799fe4961cb532f983ce2b23082366b898e52ffbce459c86f67c8378a" +checksum = "ed94fce61571a4006852b7389a063ab983c02eb1bb37b47f8272ce92d06d9538" + +[[package]] +name = "windows_x86_64_msvc" +version = "0.52.0" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "dff9641d1cd4be8d1a070daf9e3773c5f67e78b4d9d42263020c057706765c04" [[package]] name = "yansi" version = "0.5.1" source = "registry+https://github.com/rust-lang/crates.io-index" checksum = "09041cd90cf85f7f8b2df60c646f853b7f535ce68f85244eb6731cf89fa498ec" + +[[package]] +name = "zerocopy" +version = "0.7.31" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "1c4061bedbb353041c12f413700357bec76df2c7e2ca8e4df8bac24c6bf68e3d" +dependencies = [ + "zerocopy-derive", +] + +[[package]] +name = "zerocopy-derive" +version = "0.7.31" +source = "registry+https://github.com/rust-lang/crates.io-index" +checksum = "b3c129550b3e6de3fd0ba67ba5c81818f9805e58b8d7fee80a3a59d2c9fc601a" +dependencies = [ + "proc-macro2", + "quote", + "syn 2.0.41", +] diff --git a/rust/Cargo.toml b/rust/Cargo.toml index 2a2b582cea8..ac8b31a7290 100644 --- a/rust/Cargo.toml +++ b/rust/Cargo.toml @@ -1,7 +1,6 @@ # workspace is required to vendor crates for all packages. 
[workspace] members = [ - "BLAKE3", "skim", "prql", ] diff --git a/src/Access/Common/AccessType.h b/src/Access/Common/AccessType.h index f99ae2a8aea..463be6a3aea 100644 --- a/src/Access/Common/AccessType.h +++ b/src/Access/Common/AccessType.h @@ -82,7 +82,8 @@ enum class AccessType \ M(ALTER_VIEW_REFRESH, "ALTER LIVE VIEW REFRESH, REFRESH VIEW", VIEW, ALTER_VIEW) \ M(ALTER_VIEW_MODIFY_QUERY, "ALTER TABLE MODIFY QUERY", VIEW, ALTER_VIEW) \ - M(ALTER_VIEW, "", GROUP, ALTER) /* allows to execute ALTER VIEW REFRESH, ALTER VIEW MODIFY QUERY; + M(ALTER_VIEW_MODIFY_REFRESH, "ALTER TABLE MODIFY QUERY", VIEW, ALTER_VIEW) \ + M(ALTER_VIEW, "", GROUP, ALTER) /* allows to execute ALTER VIEW REFRESH, ALTER VIEW MODIFY QUERY, ALTER VIEW MODIFY REFRESH; implicitly enabled by the grant ALTER_TABLE */\ \ M(ALTER, "", GROUP, ALL) /* allows to execute ALTER {TABLE|LIVE VIEW} */\ @@ -177,12 +178,14 @@ enum class AccessType M(SYSTEM_MOVES, "SYSTEM STOP MOVES, SYSTEM START MOVES, STOP MOVES, START MOVES", TABLE, SYSTEM) \ M(SYSTEM_PULLING_REPLICATION_LOG, "SYSTEM STOP PULLING REPLICATION LOG, SYSTEM START PULLING REPLICATION LOG", TABLE, SYSTEM) \ M(SYSTEM_CLEANUP, "SYSTEM STOP CLEANUP, SYSTEM START CLEANUP", TABLE, SYSTEM) \ + M(SYSTEM_VIEWS, "SYSTEM REFRESH VIEW, SYSTEM START VIEWS, SYSTEM STOP VIEWS, SYSTEM START VIEW, SYSTEM STOP VIEW, SYSTEM CANCEL VIEW, REFRESH VIEW, START VIEWS, STOP VIEWS, START VIEW, STOP VIEW, CANCEL VIEW", VIEW, SYSTEM) \ M(SYSTEM_DISTRIBUTED_SENDS, "SYSTEM STOP DISTRIBUTED SENDS, SYSTEM START DISTRIBUTED SENDS, STOP DISTRIBUTED SENDS, START DISTRIBUTED SENDS", TABLE, SYSTEM_SENDS) \ M(SYSTEM_REPLICATED_SENDS, "SYSTEM STOP REPLICATED SENDS, SYSTEM START REPLICATED SENDS, STOP REPLICATED SENDS, START REPLICATED SENDS", TABLE, SYSTEM_SENDS) \ M(SYSTEM_SENDS, "SYSTEM STOP SENDS, SYSTEM START SENDS, STOP SENDS, START SENDS", GROUP, SYSTEM) \ M(SYSTEM_REPLICATION_QUEUES, "SYSTEM STOP REPLICATION QUEUES, SYSTEM START REPLICATION QUEUES, STOP REPLICATION QUEUES, START REPLICATION QUEUES", TABLE, SYSTEM) \ M(SYSTEM_DROP_REPLICA, "DROP REPLICA", TABLE, SYSTEM) \ M(SYSTEM_SYNC_REPLICA, "SYNC REPLICA", TABLE, SYSTEM) \ + M(SYSTEM_REPLICA_READINESS, "SYSTEM REPLICA READY, SYSTEM REPLICA UNREADY", GLOBAL, SYSTEM) \ M(SYSTEM_RESTART_REPLICA, "RESTART REPLICA", TABLE, SYSTEM) \ M(SYSTEM_RESTORE_REPLICA, "RESTORE REPLICA", TABLE, SYSTEM) \ M(SYSTEM_WAIT_LOADING_PARTS, "WAIT LOADING PARTS", TABLE, SYSTEM) \ diff --git a/src/Access/ContextAccess.cpp b/src/Access/ContextAccess.cpp index 90fddd0085d..567b131c00e 100644 --- a/src/Access/ContextAccess.cpp +++ b/src/Access/ContextAccess.cpp @@ -155,6 +155,7 @@ namespace "formats", "privileges", "data_type_families", + "database_engines", "table_engines", "table_functions", "aggregate_function_combinators", diff --git a/src/Access/tests/gtest_access_rights_ops.cpp b/src/Access/tests/gtest_access_rights_ops.cpp index b5a15513a89..a7594503992 100644 --- a/src/Access/tests/gtest_access_rights_ops.cpp +++ b/src/Access/tests/gtest_access_rights_ops.cpp @@ -51,7 +51,7 @@ TEST(AccessRights, Union) "CREATE DICTIONARY, DROP DATABASE, DROP TABLE, DROP VIEW, DROP DICTIONARY, UNDROP TABLE, " "TRUNCATE, OPTIMIZE, BACKUP, CREATE ROW POLICY, ALTER ROW POLICY, DROP ROW POLICY, " "SHOW ROW POLICIES, SYSTEM MERGES, SYSTEM TTL MERGES, SYSTEM FETCHES, " - "SYSTEM MOVES, SYSTEM PULLING REPLICATION LOG, SYSTEM CLEANUP, SYSTEM SENDS, SYSTEM REPLICATION QUEUES, " + "SYSTEM MOVES, SYSTEM PULLING REPLICATION LOG, SYSTEM CLEANUP, SYSTEM VIEWS, SYSTEM SENDS, SYSTEM REPLICATION QUEUES, 
" "SYSTEM DROP REPLICA, SYSTEM SYNC REPLICA, SYSTEM RESTART REPLICA, " "SYSTEM RESTORE REPLICA, SYSTEM WAIT LOADING PARTS, SYSTEM SYNC DATABASE REPLICA, SYSTEM FLUSH DISTRIBUTED, dictGet ON db1.*, GRANT NAMED COLLECTION ADMIN ON db1"); } diff --git a/src/AggregateFunctions/AggregateFunctionAny.cpp b/src/AggregateFunctions/AggregateFunctionAny.cpp index 15681eca817..a6010ff07c3 100644 --- a/src/AggregateFunctions/AggregateFunctionAny.cpp +++ b/src/AggregateFunctions/AggregateFunctionAny.cpp @@ -110,7 +110,7 @@ public: } } } - else + else if (row_begin < row_end) { size_t pos = First ? row_begin : row_end - 1; add(place, columns, pos, arena); diff --git a/src/AggregateFunctions/AggregateFunctionFactory.cpp b/src/AggregateFunctions/AggregateFunctionFactory.cpp index 5c101888140..b6ba562045d 100644 --- a/src/AggregateFunctions/AggregateFunctionFactory.cpp +++ b/src/AggregateFunctions/AggregateFunctionFactory.cpp @@ -51,10 +51,10 @@ void AggregateFunctionFactory::registerFunction(const String & name, Value creat void AggregateFunctionFactory::registerNullsActionTransformation(const String & source_ignores_nulls, const String & target_respect_nulls) { if (!aggregate_functions.contains(source_ignores_nulls)) - throw Exception(ErrorCodes::LOGICAL_ERROR, "registerNullsActionTransformation: Source aggregation '{}' not found"); + throw Exception(ErrorCodes::LOGICAL_ERROR, "registerNullsActionTransformation: Source aggregation '{}' not found", source_ignores_nulls); if (!aggregate_functions.contains(target_respect_nulls)) - throw Exception(ErrorCodes::LOGICAL_ERROR, "registerNullsActionTransformation: Target aggregation '{}' not found"); + throw Exception(ErrorCodes::LOGICAL_ERROR, "registerNullsActionTransformation: Target aggregation '{}' not found", target_respect_nulls); if (!respect_nulls.emplace(source_ignores_nulls, target_respect_nulls).second) throw Exception( diff --git a/src/AggregateFunctions/AggregateFunctionGroupArray.cpp b/src/AggregateFunctions/AggregateFunctionGroupArray.cpp index b95471df90a..6c6397e35d5 100644 --- a/src/AggregateFunctions/AggregateFunctionGroupArray.cpp +++ b/src/AggregateFunctions/AggregateFunctionGroupArray.cpp @@ -20,6 +20,7 @@ #include #include +#include #include diff --git a/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp b/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp deleted file mode 100644 index debc9b6d565..00000000000 --- a/src/AggregateFunctions/AggregateFunctionGroupArraySorted.cpp +++ /dev/null @@ -1,82 +0,0 @@ -#include -#include -#include -#include -#include -#include -#include - -namespace DB -{ -struct Settings; - -namespace ErrorCodes -{ - extern const int NUMBER_OF_ARGUMENTS_DOESNT_MATCH; - extern const int BAD_ARGUMENTS; -} - -namespace -{ - -template